diff --git a/.github/pull_request_template.md b/.github/pull_request_template.md
new file mode 100644
index 00000000000..5893b3c2374
--- /dev/null
+++ b/.github/pull_request_template.md
@@ -0,0 +1,12 @@
+## Summary
+
+## Additional background
+
+## Checklist
+
+The proposed changes:
+- [ ] fix a bug or incorrect behavior in AMReX
+- [ ] add new capabilities to AMReX
+- [ ] change answers in the test suite to more than roundoff level
+- [ ] are likely to significantly affect the results of downstream AMReX users
+- [ ] are described in the proposed changes to the AMReX documentation, if appropriate
diff --git a/.github/workflows/dependencies/dependencies_clang6.sh b/.github/workflows/dependencies/dependencies_clang6.sh
new file mode 100755
index 00000000000..19b348b920b
--- /dev/null
+++ b/.github/workflows/dependencies/dependencies_clang6.sh
@@ -0,0 +1,14 @@
+#!/usr/bin/env bash
+#
+# Copyright 2020 The AMReX Community
+#
+# License: BSD-3-Clause-LBNL
+# Authors: Axel Huebl
+
+set -eu -o pipefail
+
+sudo apt-get update
+
+sudo apt-get install -y \
+    build-essential \
+    clang gfortran
diff --git a/.github/workflows/dependencies/dependencies_dpcpp.sh b/.github/workflows/dependencies/dependencies_dpcpp.sh
new file mode 100755
index 00000000000..53f29b45084
--- /dev/null
+++ b/.github/workflows/dependencies/dependencies_dpcpp.sh
@@ -0,0 +1,24 @@
+#!/usr/bin/env bash
+#
+# Copyright 2020 The AMReX Community
+#
+# License: BSD-3-Clause-LBNL
+# Authors: Axel Huebl
+
+set -eu -o pipefail
+
+# Ref.: https://github.com/rscohn2/oneapi-ci
+# intel-basekit intel-hpckit are too large in size
+wget -q -O - https://apt.repos.intel.com/intel-gpg-keys/GPG-PUB-KEY-INTEL-SW-PRODUCTS-2023.PUB \
+    | sudo apt-key add -
+echo "deb https://apt.repos.intel.com/oneapi all main" \
+    | sudo tee /etc/apt/sources.list.d/oneAPI.list
+
+sudo apt-get update
+
+sudo apt-get install -y --no-install-recommends \
+    build-essential \
+    intel-oneapi-dpcpp-cpp-compiler intel-oneapi-mkl-devel \
+    g++ gfortran \
+    libopenmpi-dev \
+    openmpi-bin
diff --git a/.github/workflows/dependencies/dependencies_hip.sh b/.github/workflows/dependencies/dependencies_hip.sh
new file mode 100755
index 00000000000..3c120487d69
--- /dev/null
+++ b/.github/workflows/dependencies/dependencies_hip.sh
@@ -0,0 +1,48 @@
+#!/usr/bin/env bash
+#
+# Copyright 2020 The AMReX Community
+#
+# License: BSD-3-Clause-LBNL
+# Authors: Axel Huebl
+
+set -eu -o pipefail
+
+# Ref.: https://rocmdocs.amd.com/en/latest/Installation_Guide/Installation-Guide.html#ubuntu
+wget -q -O - http://repo.radeon.com/rocm/rocm.gpg.key \
+    | sudo apt-key add -
+echo 'deb [arch=amd64] http://repo.radeon.com/rocm/apt/debian/ xenial main' \
+    | sudo tee /etc/apt/sources.list.d/rocm.list
+
+echo 'export PATH=$PATH:/opt/rocm/bin:/opt/rocm/profiler/bin:/opt/rocm/opencl/bin' \
+    | sudo tee -a /etc/profile.d/rocm.sh
+# we should not need to export HIP_PATH=/opt/rocm/hip with those installs
+
+sudo apt-get update
+
+# Ref.: https://rocmdocs.amd.com/en/latest/Installation_Guide/Installation-Guide.html#installing-development-packages-for-cross-compilation
+# meta-package: rocm-dkms
+# OpenCL: rocm-opencl
+# other: rocm-dev rocm-utils
+sudo apt-get install -y --no-install-recommends \
+    build-essential \
+    gfortran \
+    libnuma-dev \
+    libopenmpi-dev \
+    openmpi-bin \
+    rocm-dev rocrand
+
+# activate
+#
+source /etc/profile.d/rocm.sh
+hipcc --version
+
+# cmake-easyinstall
+#
+sudo curl -L -o /usr/local/bin/cmake-easyinstall https://git.io/JvLxY
+sudo chmod a+x /usr/local/bin/cmake-easyinstall
+export CEI_SUDO="sudo"
diff --git a/.github/workflows/dependencies/dependencies_mac.sh b/.github/workflows/dependencies/dependencies_mac.sh
index 7fa6878dbb9..6226a4baadd 100755
--- a/.github/workflows/dependencies/dependencies_mac.sh
+++ b/.github/workflows/dependencies/dependencies_mac.sh
@@ -7,6 +7,10 @@
 
 set -eu -o pipefail
 
+brew uninstall openssl@1.0.2t
+brew uninstall python@2.7.17
+brew untap local/openssl
+brew untap local/python2
 brew update
 brew install libomp
 brew install open-mpi
diff --git a/.github/workflows/linux.yml b/.github/workflows/linux.yml
index 26ca812a498..e54fccad944 100644
--- a/.github/workflows/linux.yml
+++ b/.github/workflows/linux.yml
@@ -5,8 +5,9 @@ on: [push, pull_request]
 jobs:
   # Build and install libamrex as AMReX CMake project
   library:
-    name: GNU@7.5 C++17 [lib]
+    name: GNU@7.5 C++17 Release [lib]
     runs-on: ubuntu-latest
+    env: {CXXFLAGS: "-Werror -Wshadow -Woverloaded-virtual -Wunreachable-code"}
     steps:
     - uses: actions/checkout@v2
     - name: Dependencies
@@ -16,15 +17,44 @@
         mkdir build
         cd build
         cmake .. \
+            -DCMAKE_VERBOSE_MAKEFILE=ON \
            -DCMAKE_INSTALL_PREFIX=/tmp/my-amrex \
            -DCMAKE_CXX_STANDARD=17
-        make -j 2 VERBOSE=ON
+        make -j 2
+        make install
+
+  library_clang:
+    name: Clang@6.0 C++14 SP NOMPI Debug [lib]
+    runs-on: ubuntu-latest
+    env: {CXXFLAGS: "-Werror -Wshadow -Woverloaded-virtual -Wextra-semi -Wunreachable-code"}
+    steps:
+    - uses: actions/checkout@v2
+    - name: Dependencies
+      run: .github/workflows/dependencies/dependencies_clang6.sh
+    - name: Build & Install
+      run: |
+        mkdir build
+        cd build
+        cmake .. \
+            -DCMAKE_BUILD_TYPE=Debug \
+            -DCMAKE_VERBOSE_MAKEFILE=ON \
+            -DCMAKE_INSTALL_PREFIX=/tmp/my-amrex \
+            -DAMReX_MPI=OFF \
+            -DAMReX_PARTICLES=ON \
+            -DAMReX_PRECISION=SINGLE \
+            -DAMReX_PARTICLES_PRECISION=SINGLE \
+            -DCMAKE_CXX_STANDARD=14 \
+            -DCMAKE_C_COMPILER=$(which clang) \
+            -DCMAKE_CXX_COMPILER=$(which clang++) \
+            -DCMAKE_Fortran_COMPILER=$(which gfortran)
+        make -j 2
         make install
 
   # Build libamrex and all tutorials
   tutorials:
     name: GNU@7.5 C++14 [tutorials]
     runs-on: ubuntu-latest
+    env: {CXXFLAGS: "-Werror -Wshadow -Woverloaded-virtual -Wunreachable-code"}
     steps:
     - uses: actions/checkout@v2
     - name: Dependencies
@@ -33,13 +63,18 @@
       run: |
         mkdir build
         cd build
-        cmake .. -DENABLE_TUTORIALS=ON
-        make -j 2 tutorials
+        cmake .. \
+            -DCMAKE_BUILD_TYPE=Debug \
+            -DCMAKE_VERBOSE_MAKEFILE=ON \
+            -DAMReX_BUILD_TUTORIALS=ON \
+            -DAMReX_PARTICLES=ON
+        make -j 2
 
   # Build libamrex and all tutorials
   tutorials_cxx20:
     name: GNU@10.1 C++20 [tutorials]
     runs-on: ubuntu-latest
+    env: {CXXFLAGS: "-Werror -Wno-error=deprecated-declarations -Wshadow -Woverloaded-virtual -Wunreachable-code"}
     steps:
     - uses: actions/checkout@v2
     - name: Dependencies
@@ -48,18 +83,22 @@
       run: |
         mkdir build
         cd build
-        cmake .. \
-            -DENABLE_TUTORIALS=ON \
-            -DCMAKE_CXX_STANDARD=20 \
+        cmake .. \
+            -DCMAKE_BUILD_TYPE=Debug \
+            -DCMAKE_VERBOSE_MAKEFILE=ON \
+            -DAMReX_BUILD_TUTORIALS=ON \
+            -DAMReX_PARTICLES=ON \
+            -DCMAKE_CXX_STANDARD=20 \
             -DCMAKE_C_COMPILER=$(which gcc-10) \
             -DCMAKE_CXX_COMPILER=$(which g++-10) \
             -DCMAKE_Fortran_COMPILER=$(which gfortran-10)
-        make -j 2 tutorials
+        make -j 2
 
   # Build libamrex and all tutorials w/o MPI
   tutorials-nonmpi:
-    name: GNU@7.5 C++14 non-MPI [tutorials]
+    name: GNU@7.5 C++14 NOMPI [tutorials]
     runs-on: ubuntu-latest
+    env: {CXXFLAGS: "-Werror -Wshadow -Woverloaded-virtual -Wunreachable-code"}
     steps:
     - uses: actions/checkout@v2
     - name: Dependencies
@@ -68,13 +107,19 @@
       run: |
         mkdir build
         cd build
-        cmake .. -DENABLE_TUTORIALS=ON -DENABLE_MPI=OFF
-        make -j 2 tutorials
+        cmake .. \
+            -DCMAKE_BUILD_TYPE=Debug \
+            -DCMAKE_VERBOSE_MAKEFILE=ON \
+            -DAMReX_BUILD_TUTORIALS=ON \
+            -DAMReX_MPI=OFF \
+            -DAMReX_PARTICLES=ON
+        make -j 2
 
   # Build libamrex and all tutorials
   tutorials-nofortran:
     name: GNU@7.5 C++11 w/o Fortran [tutorials]
     runs-on: ubuntu-latest
+    env: {CXXFLAGS: "-Werror -Wshadow -Woverloaded-virtual -Wunreachable-code"}
     steps:
     - uses: actions/checkout@v2
     - name: Dependencies
@@ -83,15 +128,18 @@
       run: |
         mkdir build
         cd build
-        cmake .. \
-            -DENABLE_TUTORIALS=ON \
-            -DENABLE_FORTRAN=OFF \
+        cmake .. \
+            -DCMAKE_BUILD_TYPE=Debug \
+            -DCMAKE_VERBOSE_MAKEFILE=ON \
+            -DAMReX_BUILD_TUTORIALS=ON \
+            -DAMReX_PARTICLES=ON \
+            -DAMReX_FORTRAN=OFF \
             -DCMAKE_CXX_STANDARD=11
-        make -j 2 tutorials
+        make -j 2
 
   # Build libamrex and all tutorials with CUDA
   tutorials-cuda:
-    name: CUDA@9.1.85 GNU@4.8.5 C++11 [tutorials]
+    name: CUDA@9.1.85 GNU@4.8.5 C++11 Release [tutorials]
     runs-on: ubuntu-latest
     steps:
     - uses: actions/checkout@v2
@@ -102,11 +150,143 @@
         mkdir build
         cd build
         cmake .. \
-            -DENABLE_TUTORIALS=ON \
-            -DENABLE_CUDA=ON \
+            -DCMAKE_VERBOSE_MAKEFILE=ON \
+            -DAMReX_BUILD_TUTORIALS=ON \
+            -DAMReX_PARTICLES=ON \
+            -DAMReX_GPU_BACKEND=CUDA \
             -DCMAKE_C_COMPILER=$(which gcc-4.8) \
             -DCMAKE_CXX_COMPILER=$(which g++-4.8) \
            -DCMAKE_CUDA_HOST_COMPILER=$(which g++-4.8) \
             -DCMAKE_Fortran_COMPILER=$(which gfortran-4.8) \
-            -DCUDA_ARCH=6.0
-        make -j 2 tutorials
+            -DAMReX_CUDA_ARCH=6.0
+        make -j 2
+
+  tutorials-dpcpp:
+    name: DPCPP@PubBeta GFortran@7.5 C++17 [tutorials]
+    runs-on: ubuntu-latest
+    steps:
+    - uses: actions/checkout@v2
+    - name: Dependencies
+      run: .github/workflows/dependencies/dependencies_dpcpp.sh
+    - name: Build & Install
+      run: |
+        set +e
+        source /opt/intel/oneapi/setvars.sh
+        set -e
+        mkdir build
+        cd build
+        cmake .. \
+            -DCMAKE_VERBOSE_MAKEFILE=ON \
+            -DAMReX_BUILD_TUTORIALS=ON \
+            -DAMReX_PARTICLES=ON \
+            -DAMReX_GPU_BACKEND=SYCL \
+            -DCMAKE_C_COMPILER=$(which clang) \
+            -DCMAKE_CXX_COMPILER=$(which dpcpp) \
+            -DCMAKE_Fortran_COMPILER=$(which gfortran)
+        make -j 2
+
+  tutorials-hip:
+    name: HIP ROCm@3.8 GFortran@9.3 C++17 [tutorials]
+    runs-on: ubuntu-20.04
+    steps:
+    - uses: actions/checkout@v2
+    - name: Dependencies
+      run: .github/workflows/dependencies/dependencies_hip.sh
+    - name: Build & Install
+      run: |
+        source /etc/profile.d/rocm.sh
+        hipcc --version
+        mkdir build
+        cd build
+        cmake .. \
+            -DCMAKE_VERBOSE_MAKEFILE=ON \
+            -DAMReX_BUILD_TUTORIALS=ON \
+            -DAMReX_PARTICLES=ON \
+            -DAMReX_FORTRAN=ON \
+            -DAMReX_LINEAR_SOLVERS=ON \
+            -DAMReX_GPU_BACKEND=HIP \
+            -DAMReX_AMD_ARCH=gfx900 \
+            -DCMAKE_C_COMPILER=$(which hipcc) \
+            -DCMAKE_CXX_COMPILER=$(which hipcc) \
+            -DCMAKE_Fortran_COMPILER=$(which gfortran)
+        make -j 2
+
+  # Build 1D libamrex with configure
+  configure-1d:
+    name: GNU@7.5 Release [configure 1D]
+    runs-on: ubuntu-latest
+    steps:
+    - uses: actions/checkout@v2
+    - name: Dependencies
+      run: .github/workflows/dependencies/dependencies.sh
+    - name: Build & Install
+      run: |
+        ./configure --dim 1
+        make -j2
+        make install
+
+  # Build 2D libamrex with configure
+  configure-2d:
+    name: Clang@6.0 NOMPI Release [configure 2D]
+    runs-on: ubuntu-latest
+    steps:
+    - uses: actions/checkout@v2
+    - name: Dependencies
+      run: .github/workflows/dependencies/dependencies_clang6.sh
+    - name: Build & Install
+      run: |
+        ./configure --dim 2 --with-fortran no --comp llvm --with-mpi no
+        make -j2 WARN_ALL=TRUE WARN_ERROR=TRUE
+        make install
+
+  # Build 3D libamrex with configure
+  configure-3d:
+    name: GNU@7.5 Release [configure 3D]
+    runs-on: ubuntu-latest
+    steps:
+    - uses: actions/checkout@v2
+    - name: Dependencies
+      run: .github/workflows/dependencies/dependencies.sh
+    - name: Build & Install
+      run: |
+        ./configure --dim 3 --enable-eb yes --enable-xsdk-defaults yes
+        make -j2 WARN_ALL=TRUE WARN_ERROR=TRUE
+        make install
+
+  # Build 3D libamrex debug omp build with configure
+  configure-3d-omp-debug:
+    name: GNU@7.5 OMP Debug [configure 3D]
+    runs-on: ubuntu-latest
+    steps:
+    - uses: actions/checkout@v2
+    - name: Dependencies
+      run: .github/workflows/dependencies/dependencies.sh
+    - name: Build & Install
+      run: |
+        ./configure --dim 3 --enable-eb yes --enable-xsdk-defaults yes --with-omp yes --debug yes
+        make -j2 WARN_ALL=TRUE WARN_ERROR=TRUE
+        make install
+
+  # Build libamrex and run all tests
+  tests:
+    name: GNU@7.5 C++14 [tests]
+    runs-on: ubuntu-latest
+    env: {CXXFLAGS: "-Werror -Wshadow -Woverloaded-virtual -Wunreachable-code"}
+    steps:
+    - uses: actions/checkout@v2
+    - name: Dependencies
+      run: .github/workflows/dependencies/dependencies.sh
+    - name: Build & Install
+      run: |
+        mkdir build
+        cd build
+        cmake .. \
+            -DAMReX_OMP=ON \
+            -DCMAKE_VERBOSE_MAKEFILE=ON \
+            -DAMReX_ENABLE_TESTS=ON \
+            -DAMReX_PARTICLES=ON
+        make -j 2
+    - name: Run tests
+      run: |
+        cd build
+        ctest --output-on-failure -R
diff --git a/.github/workflows/macos.yml b/.github/workflows/macos.yml
index 71fe768e220..4a37ba1d906 100644
--- a/.github/workflows/macos.yml
+++ b/.github/workflows/macos.yml
@@ -2,6 +2,9 @@ name: macos
 
 on: [push, pull_request]
 
+env:
+  CXXFLAGS: "-Werror -Wshadow -Woverloaded-virtual -Wextra-semi -Wunreachable-code"
+
 jobs:
   # Build libamrex and all tutorials
   tutorials-macos:
@@ -15,5 +18,9 @@
       run: |
         mkdir build
         cd build
-        cmake .. -DENABLE_TUTORIALS=ON
-        make -j 2 tutorials
+        cmake .. \
+            -DCMAKE_BUILD_TYPE=Debug \
+            -DCMAKE_VERBOSE_MAKEFILE=ON \
+            -DAMReX_BUILD_TUTORIALS=ON \
+            -DAMReX_PARTICLES=ON
+        make -j 2
diff --git a/.github/workflows/windows.yml b/.github/workflows/windows.yml
new file mode 100644
index 00000000000..f81564346e6
--- /dev/null
+++ b/.github/workflows/windows.yml
@@ -0,0 +1,17 @@
+name: windows
+
+on: [push, pull_request]
+
+jobs:
+  # Build libamrex and all tutorials
+  tutorials:
+    name: MSVC C++17 w/o Fortran w/o MPI
+    runs-on: windows-latest
+    steps:
+    - uses: actions/checkout@v2
+    - name: Build & Install
+      run: |
+        mkdir build
+        cd build
+        cmake .. -DCMAKE_BUILD_TYPE=Debug -DCMAKE_VERBOSE_MAKEFILE=ON -DAMReX_BUILD_TUTORIALS=ON -DAMReX_FORTRAN=OFF -DAMReX_MPI=OFF
+        cmake --build . --config Debug
diff --git a/.gitignore b/.gitignore
index 47f16d489b0..a879e781eeb 100644
--- a/.gitignore
+++ b/.gitignore
@@ -5,6 +5,7 @@ nohup.out
 *.exe
 *.exe.dSYM
 *~
+build/
 tmp_build_dir/
 d/
 f/
diff --git a/CHANGES b/CHANGES
index e7a7b3e4563..4b23a0ba44b 100644
--- a/CHANGES
+++ b/CHANGES
@@ -1,3 +1,289 @@
+# 20.11
+
+ -- The default hypre interface in MLMG is now IJ matrix for both EB and
+    non-EB. Previously, it was semi-struct for non-EB. (#1492)
+
+ -- USE_SAVE_TEMPS option in GNU Make system for HIP. (#1492)
+
+ -- The device version of `Error`, `Abort` and `Warning` is a no-op, unless
+    `NDEBUG` is defined. (#1492)
+
+ -- Ascent: Use Default Name for Mesh Ghost (#1488)
+
+ -- Add fill method to GpuArray (#1472)
+
+ -- Add Gpu::Atomic::AddNoRet (#1469)
+
+ -- Option to make the code NOT enforce solvability in MLMG for singular
+    problems. (#1471)
+
+ -- CMake: improve HDF5 support (#1468)
+
+ -- CMake: FindPETSc must not overwrite CMAKE_Fortran_FLAGS (#1464)
+
+ -- CMake: prevent in-source builds (#1453)
+
+ -- change char * to char const* so SWFFT code compiles with USE_CUDA=TRUE
+    (#1454)
+
+ -- Fix when small_volfrac is used -- we need to adjust the data in cut
+    cell neighbors as well as regular neighbors. (#1451)
+
+ -- Allow users to set a Geometry object for ParticleContainer
+    independently of the AmrCore / AmrLevel object. (#1446)
+
+ -- HDF5 plotfile write bug fix and performance improvement (#1448)
+
+ -- CMake: add HIP support (#1316)
+
+ -- NodalProjector: use volume-weighted average down (#1444)
+
+ -- Fix race conditions in EB interpolation from cell centers to faces
+    (#1443)
+
+ -- Allow tagging value to vary by level (#1441)
+
+ -- Hypre with overset (#1439)
+
+ -- Hypre IJ interface: Enable access to additional solvers and
+    preconditioners available in Hypre (#1437)
+
+ -- Fix CPU version of uninitializedFillNImpl in PODVector (#1435)
+
+ -- CMake: Fix missing compile time definitions for HYPRE/PETSc (#1436)
+
+ -- Fix bug in EB extdir slopes (#1434)
+
+ -- Make the id and cpu members of amrex_particle private, as they should
+    no longer be accessed directly. (#1433)
+
+ -- Disable OpenMPI C++ binding in GNU make system (#1398)
+
+ -- Fix a long standing bug in eb levelset (#1432)
+
+# 20.10
+
+ -- CMake: fix ENABLE_PROFPARSER and ENABLE_SENSEI options (#1428)
+
+ -- Remove EB LSCore and levelset, and reimplement signed distance function
+    capability. (#1429 & #1425)
+
+ -- Remove flags setCGVerbose and setCGMaxIter since those are more
+    accurately called setBottomVerbose and setBottomMaxIter. The
+    "setCG..." flags are misleading since they actually apply to non-CG
+    bottom solvers as well. (#1413)
+
+ -- Remove GetPosition and SetPosition from ParIter. These were added for
+    WarpX, but they are not used any more. (#1408)
+
+ -- Only check the requested MPI Threading level if AMReX also initialized
+    MPI. (#1406)
+
+ -- DPCPP support for multiple GPUs (#1392)
+
+ -- Random Number Generation on Device (#1363) In order to support RNG on
+    device with DPC++, we have to change the API because DPC++ does not
+    support global device variables.
+
+ -- Remove redundant particle tests and old/obsolete/non-test tests (#1389
+    & #1381)
+
+ -- Gpu kernel fusing is integrated in MFIter. (#1332)
+
+ -- New runtime parameter, amrex.max_gpu_streams. (#1386)
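
As a minimal sketch of how such a runtime parameter is consumed (our illustration, not code from the PR; the fallback value of 4 below is made up, not AMReX's actual default):

```
#include <AMReX_ParmParse.H>

// Hedged sketch: read amrex.max_gpu_streams through ParmParse.
void read_max_gpu_streams ()
{
    amrex::ParmParse pp("amrex");       // "amrex." namespace prefix
    int max_gpu_streams = 4;            // illustrative fallback only
    pp.query("max_gpu_streams", max_gpu_streams); // inputs file wins if set
}
```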
+
+ -- Switch to `use mpi` from `include 'mpif.h'` (#1385)
+
+ -- Remove reliance on managed memory from
+    AMReX_ParticleCommunication.H/.cpp (#1380)
+
+ -- CMake: re-organize tutorials (#1333)
+
+ -- Implement Particle in a way that does not involve UB. (#1337)
+
+ -- amrex::EB_average_down(): Fix indexing error. (#1360)
+
+ -- Only add one copy of the ghost particle regardless of how many isects
+    we have (#1359)
+
+ -- Add non-EB slopes and extend the generality of EB slope routines in 2D
+    and 3D (#1350)
+
+ -- Async IO: Check Runtime Threading (#1351)
+
+ -- Changes to make AMR codes compiled with EB but not building any
+    Geometry work as if it is all regular. (#1349)
+
+ -- Fix mkconfig.py (#1344)
+
+ -- Add -Xcudafe --diag_suppress=esa_on_defaulted_function_ignored to
+    suppress spurious warnings from nvcc. (#1342)
+
+ -- EB extend_domain_face (#1321)
+
+ -- Add parameter that stores OpenMP support version (#1325)
+
+# 20.09
+
+ -- Fix interpolation coefficients for EB stencil in cell-centered linear
+    solvers when the EB surface at the domain boundary is tilted.
+
+ -- Add a parameter to `AMReX_omp_mod` that can be used by Fortran code to
+    check whether AMReX was built with OpenMP support, and, if yes, what
+    the version number (_OPENMP) was at the time AMReX was compiled.
+
+ -- CMake: re-write genex evaluation functions.
+
+ -- Extend the number of unique particles per cpu we can have at once.
+
+ -- Add a new method to the `amrex_distromap` type in
+    F_Interfaces. `get_pmap` fills a caller-owned array of PEs.
+
+ -- Fix a long standing bug in GNU make system on the use of HOST and
+    HOSTNAME.
+
+ -- Add Scan::InclusiveSum and ExclusiveSum for CPU to avoid ifdef.
+
+ -- Add check for empty probin_file in Amr::restart.
+
+ -- Update Sundials interface, documentation, and build to be version
+    agnostic.
+
+ -- Updates for ROCm 3.6 and 3.7.
+
+ -- Add section to Make.unknown for intel mpi.
+
+ -- CMake: re-factor third party libraries setup.
+
+ -- Port TagBoxArray to GPU.
+
+ -- Fix a bug in matching of COMP_VERSION to correctly treat CCE > 9.
+
+ -- By default, EB outside the domain will be generated by extending from
+    the domain faces.
+
+ -- Fix an issue due to roundoff error in determining whether particles
+    are inside the domain.
+
+ -- Remove Perilla because it's incompatible with our GPU strategy and it's
+    no longer being maintained.
+
+ -- Switch the overset mask convention so that 1 means unknown and 0 means
+    known. The new convention is more convenient for AMR-Wind.
+
+ -- Remove old solvers, Src/LinearSolvers/C_CellMG and C_TensorMG. They
+    have been superseded by Src/LinearSolvers/MLMG.
+
+ -- MacProjector: allow for re-use of the object and enhance multi-level
+    algorithm.
+
+ -- Add asserts for bounds checking to Array1D and Array2D.
+
+ -- Optimization of the construction of SFC.
+
+ -- Refactoring of particle buffer map.
+
+ -- Optimization of FPinfo and complementIn.
+
+ -- Make the Amr/Extrapolater used in IAMR/PeleLM C++/GPU compliant.
+
+ -- Less surprising behavior for the ok() method of FabArray. This makes
+    the `ok()` method of FabArray return `false` instead of crashing if the
+    `define()` method has yet to be called.
+
+ -- Optimization of regrid.
+
+ -- Special FillBoundary for Almo.
+
+ -- Fix the average_down_faces calls in linear solvers to see periodicity.
+
+ -- Make sure the calculation of divu at inflow face in nodal projection
+    does not use tangential velocities on an inflow face.
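
The Array1D/Array2D bounds-checking entry above is easiest to see with a small sketch (ours, not from the PR); `Array2D` takes compile-time lower and upper bounds, so indexing need not start at zero:

```
#include <AMReX_Array.H>

// Hedged sketch: a 3x3 fixed-size array indexed 1..3 in each dimension.
// In a debug build (assertions enabled), an out-of-range access such as
// a(0,0) should now trip the bounds-checking assert mentioned above.
amrex::Real sum_entries ()
{
    amrex::Array2D<amrex::Real, 1, 3, 1, 3> a;
    amrex::Real s = 0.0;
    for (int j = 1; j <= 3; ++j) {
        for (int i = 1; i <= 3; ++i) {
            a(i,j) = static_cast<amrex::Real>(i + 10*j);
            s += a(i,j);
        }
    }
    return s;
}
```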
+
+# 20.08
+
+ -- New average_down_faces functions that take periodic boundary into account.
+
+ -- Update the documentation for Nsight.
+
+ -- Fix a bug with HDF5 boxcenter data.
+
+ -- New runtime parameter, `eb2.extend_domain_face`, that can be used to extrapolate EB information
+    from domain faces.
+
+ -- New GNU Make options for GCC and Clang, `WARN_ALL` and `WARN_ERROR`. `WARN_ALL` turns on more
+    compiler warnings. `WARN_ERROR` turns warnings into errors.
+
+ -- Fix various compiler warnings.
+
+ -- Fix memory fragmentation issue with communication buffer.
+
+ -- Semi-coarsening support in linear solvers.
+
+ -- Fix virtual particle issues.
+
+ -- Capability to fuse GPU kernel launches.
+
+ -- Make ghost particles support SoA data.
+
+ -- CMake: ability to export build tree.
+
+ -- Reset amrex_geometry_module initialization state when finalizing.
+
+ -- Remove Long version of Gatherv.
+
+ -- Optimization of TagBoxArray::collate.
+
+ -- CMake: fix missing PETSc setup in Config file.
+
+ -- BndryFunc for nodal data.
+
+ -- MLMG Hypre fix for singular problems.
+
+ -- Add particle copy filters.
+
+ -- Async output support for particles.
+
+ -- BackgroundThread class.
+
+# 20.07
+
+ -- Nodal hypre solver now supports coarsening before hypre is called.
+
+ -- A new ParmParse parameter, `amrex.the_arena_is_managed`, is introduced to set the default memory
+    type of `The_Arena`.
+
+ -- MFIter is now OMP thread safe when it is compiled with GPU support.
+
+ -- Overset support is added to cell-center and tensor linear solvers.
+
+ -- Remove compile time flag, BACKTRACE, for simplicity.
+
+ -- Updates on Blueprint and Ascent.
+
+ -- HDF5 support in GNU Make and CMake.
+
+ -- CMake support for DPC++.
+
+ -- Add -DNDEBUG for non-debug build.
+
+ -- Support for Windows.
+
+ -- Support for ParallelContext in Particles.
+
+ -- Non const iterator for neighbor list.
+
+ -- Tool for comparing single-level plotfiles of all nodalities.
+
+ -- GNU Make: Use -M instead of the perl script to generate dependencies.
+
+ -- Particle: Remove direct access to the m_idata and m_rdata structs internally.
+
+ -- Extend the makeSFC method to take an additional argument where the user can override the number
+    of processes a BoxArray is distributed to.
+
+ -- Turn tiling off by default for gpu.
+
 # 20.06
 
  -- Set a non-default CMAKE_INSTALL_PREFIX only if AMReX is the
@@ -43,7 +329,7 @@
 
  -- Add CUPTI trace for CUDA kernel timing.
 
- -- Implement ENABLE_FORTRAN (BL_NO_FORT) option in CMake.
+ -- Implement AMReX_FORTRAN (BL_NO_FORT) option in CMake.
 
  -- Fix CUDA build of tools.
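
Two of the additions listed above lend themselves to a short illustration. The following is a hedged sketch (ours, not part of the PR) of `GpuArray::fill` (#1472) and `Gpu::Atomic::AddNoRet` (#1469); exact headers and signatures may differ slightly across AMReX versions:

```
#include <AMReX.H>
#include <AMReX_Array.H>
#include <AMReX_Gpu.H>
#include <AMReX_Print.H>

int main (int argc, char* argv[])
{
    amrex::Initialize(argc, argv);
    {
        // GpuArray::fill: set every element to one value (host or device).
        amrex::GpuArray<amrex::Real,3> v;
        v.fill(1.5);

        // Gpu::Atomic::AddNoRet: atomic add that does not return the old
        // value, which can be cheaper than Gpu::Atomic::Add on some backends.
        amrex::Gpu::DeviceScalar<amrex::Real> sum(0.0);
        amrex::Real* p = sum.dataPtr();
        amrex::ParallelFor(100, [=] AMREX_GPU_DEVICE (int /*i*/)
        {
            amrex::Gpu::Atomic::AddNoRet(p, v[0]); // accumulate 100 * 1.5
        });
        amrex::Print() << "sum = " << sum.dataValue() << "\n"; // expect 150
    }
    amrex::Finalize();
}
```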
diff --git a/CMakeLists.txt b/CMakeLists.txt
index 43b8020b660..8ffb19eb045 100644
--- a/CMakeLists.txt
+++ b/CMakeLists.txt
@@ -1,49 +1,28 @@
 cmake_minimum_required(VERSION 3.14)
 
-########################################################################
 #
-# Set variables for AMReX versioning
+# Prevent in-source builds
 #
-########################################################################
-find_package (Git QUIET)
-
-set( _tmp "" )
-
-# Try to inquire software version from git
-if ( EXISTS ${CMAKE_CURRENT_LIST_DIR}/.git AND ${GIT_FOUND} )
-   execute_process ( COMMAND git describe --abbrev=12 --dirty --always --tags
-      WORKING_DIRECTORY ${CMAKE_CURRENT_LIST_DIR}
-      OUTPUT_VARIABLE _tmp )
-   string( STRIP ${_tmp} _tmp )
-   # filter invalid descriptions in shallow git clones
-   if (NOT _tmp MATCHES "^([0-9]+)\\.([0-9]+)(\\.([0-9]+))*(-.*)*$")
-      set( _tmp "")
-   endif ()
-endif()
-
-# Grep first line from file CHANGES if cannot find version from Git
-if (NOT _tmp)
-   file(STRINGS ${CMAKE_CURRENT_LIST_DIR}/CHANGES ALL_VERSIONS REGEX "#")
-   list(GET ALL_VERSIONS 0 _tmp)
-   string(REPLACE "#" "" _tmp "${_tmp}")
-   string(STRIP "${_tmp}" _tmp )
-   set(_tmp "${_tmp}.0")
+if (CMAKE_BINARY_DIR STREQUAL CMAKE_SOURCE_DIR)
+   message(FATAL_ERROR
+      "\nin-source builds are not allowed: "
+      "build directory cannot be in the source directory path!\n"
+      "You MUST remove the file ${CMAKE_BINARY_DIR}/CMakeCache.txt and "
+      " the directory ${CMAKE_BINARY_DIR}/CMakeFiles/ to be able to build again.")
 endif ()
 
-set( AMREX_GIT_VERSION "${_tmp}" CACHE INTERNAL "" )
-unset(_tmp)
 
-# Package version is a modified form of AMREX_GIT_VERSION
-if (AMREX_GIT_VERSION)
-   string(FIND "${AMREX_GIT_VERSION}" "-" _idx REVERSE)
-   string(SUBSTRING "${AMREX_GIT_VERSION}" 0 "${_idx}" _pkg_version )
-   string(FIND "${_pkg_version}" "-" _idx REVERSE)
-   string(SUBSTRING "${_pkg_version}" 0 "${_idx}" _pkg_version )
-   string(REPLACE "-" "." _pkg_version "${_pkg_version}")
-endif ()
+#
+# Set search path for AMReX-specific CMake modules
+#
+set( AMREX_CMAKE_MODULES_PATH "${CMAKE_CURRENT_LIST_DIR}/Tools/CMake" CACHE INTERNAL "" )
+set( CMAKE_MODULE_PATH ${AMREX_CMAKE_MODULES_PATH} )
 
-set( AMREX_PKG_VERSION "${_pkg_version}" CACHE INTERNAL "" )
-unset(_pkg_version)
+#
+# Retrieve amrex version
+#
+include( AMReX_Utils )
+get_amrex_version()
 
 ########################################################################
@@ -60,11 +39,6 @@ project( AMReX
 
 message(STATUS "CMake version: ${CMAKE_VERSION}")
 
-#
-# Load required modules
-#
-set( AMREX_CMAKE_MODULES_PATH "${CMAKE_CURRENT_LIST_DIR}/Tools/CMake" CACHE INTERNAL "" )
-set( CMAKE_MODULE_PATH ${AMREX_CMAKE_MODULES_PATH} )
 
 #
 # Provide a default install directory
@@ -74,28 +48,52 @@ if ( CMAKE_SOURCE_DIR STREQUAL PROJECT_SOURCE_DIR AND CMAKE_INSTALL_PREFIX_INITI
       CACHE PATH "AMReX installation directory" FORCE)
 endif ()
 
+message(STATUS "AMReX installation directory: ${CMAKE_INSTALL_PREFIX}")
+
+#
+# Check if CMAKE_BUILD_TYPE is given. If not, use default
+#
+if ( NOT CMAKE_BUILD_TYPE )
+   set(CMAKE_CONFIGURATION_TYPES "Release;Debug;MinSizeRel;RelWithDebInfo")
+   set(CMAKE_BUILD_TYPE Release
+       CACHE STRING
+       "Choose the build type, e.g. Release, Debug, or RelWithDebInfo." FORCE)
+else ()
+   message(STATUS "Build type set by user to '${CMAKE_BUILD_TYPE}'.")
+endif()
+
 #
 # Include options, utilities and other stuff we need
 #
-include( AMReX_Utils )
-include( AMReX_Options )
-include( AMReX_Machines )
+include( AMReXOptions )
 
 #
 # Enable Fortran if requested
 #
-if(ENABLE_FORTRAN)
+if(AMReX_FORTRAN)
    enable_language(Fortran)
 endif ()
 
 #
 # Enable CUDA if requested
 #
-if (ENABLE_CUDA)
+if (AMReX_CUDA)
+   # CMake 3.18+: CMAKE_CUDA_ARCHITECTURES
+   # https://cmake.org/cmake/help/latest/policy/CMP0104.html
+   if(POLICY CMP0104)
+      cmake_policy(SET CMP0104 OLD)
+   endif()
+
    enable_language(CUDA)
    include(AMReX_SetupCUDA)
 endif ()
 
+#
+# Check compiler version
+#
+set_mininum_cxx_compiler_version(GNU 4.8)
+set_mininum_cxx_compiler_version(MSVC 19.23)
+
 #
 # Set CMAKE_<LANG>_FLAGS_<CONFIG> if not already defined
 #
@@ -109,19 +107,30 @@ add_subdirectory(Src)
 
 #
 # Tutorials and "test_install" target
 #
-option(ENABLE_TUTORIALS "Enable Tutorials" NO)
+option(AMReX_BUILD_TUTORIALS "Build tutorials" NO)
 
-if (ENABLE_TUTORIALS)
+if (AMReX_BUILD_TUTORIALS)
+   message(STATUS "Enabling Tutorials")
    add_subdirectory(Tutorials)
 endif ()
 
 #
 # Plotfile tools
 #
-option(ENABLE_PLOTFILE_TOOLS "Enable Plotfile tools" NO)
+option(AMReX_PLOTFILE_TOOLS "Enable Plotfile tools" NO)
 
-if (ENABLE_PLOTFILE_TOOLS)
+if (AMReX_PLOTFILE_TOOLS)
    # If this get executed, it cannot be EXCLUDED_FROM_ALL
    # because it needs to get installed
    add_subdirectory(Tools/Plotfile)
 endif ()
+
+
+#
+# Enable CTests
+#
+option(AMReX_ENABLE_TESTS "Enable CTest suite for AMReX" NO)
+if (AMReX_ENABLE_TESTS)
+   enable_testing()
+   add_subdirectory(Tests)
+endif ()
diff --git a/CONTRIBUTING.md b/CONTRIBUTING.md
index 399f577efb9..93eb0a64337 100644
--- a/CONTRIBUTING.md
+++ b/CONTRIBUTING.md
@@ -8,9 +8,6 @@ Development generally follows the following ideas:
 
    Nightly regression testing is used to ensure that no answers
    change (or if they do, that the changes were expected).
 
-   If a change is critical, we can cherry-pick the commit from
-   `development` to `master`.
-
 * Bug fixes, questions and contributions of new features are welcome!
 
 * Bugs should be reported through GitHub issues
@@ -33,15 +30,10 @@ Development generally follows the following ideas:
   distribute, and sublicense such enhancements or derivative works
   thereof, in binary and source code form.
 
- * On the first workday of each month, we perform a merge of
-   `development` into `master`.  For this merge to take place, we
-   need to be passing the regression tests.
-
-   To accommodate this need, we close the merge window into
-   `development` a few days before the merge day.  While the merge
-   window is closed, only bug fixes should be pushed into
-   `development`.  Once the merge from `development` -> `master` is
-   done, the merge window reopens.
+ * On the first workday of each month, we make a tagged release.  The merge window into
+   `development` is closed a few days before the release day.  While the merge window is closed,
+   only bug fixes should be merged into `development`.  Once the release is done, the merge window
+   reopens.
 
 ## Git workflow
 
@@ -79,9 +71,8 @@ git remote add upstream https://github.com/AMReX-Codes/amrex
 git remote set-url --push upstream https://github.com/<myGithubUsername>/amrex.git
 git fetch upstream
 
-# We recommend setting your development and master branches to track the upstream ones instead of your fork:
+# We recommend setting your development branch to track the upstream one instead of your fork:
 git branch -u upstream/development
-git checkout -t -b master upstream/master
 ```
 
 Now you are free to play with your fork (for additional information, you can visit the
 [Github fork help page](https://help.github.com/en/articles/fork-a-repo)).
@@ -91,7 +82,7 @@ Now you are free to play with your fork (for additional information, you can vis
 > on your fork with
 > ```
 > git checkout development
-> git pull development
+> git pull
 > ```
 
 Make sure you are on the `development` branch with
@@ -177,6 +168,57 @@ and you can delete the remote one on your fork with
 git push origin --delete <branch_name>
 ```
 
+Generally speaking, you want to follow these rules.
+
+  * Do not merge your branch for PR into your local `development` branch that tracks AMReX
+    `development` branch.  Otherwise your local `development` branch will diverge from AMReX
+    `development` branch.
+
+  * Do not commit in your `development` branch that tracks AMReX `development` branch.
+
+  * Always create a new branch based off `development` branch for each pull request, unless you are
+    going to use git to fix it later.
+
+If you have accidentally committed in `development` branch, you can fix it as follows,
+```
+git checkout -b new_branch
+git checkout development
+git reset HEAD~2  # Here 2 is the number of commits you have accidentally committed in development
+git checkout .
+```
+After this, the local `development` should be in sync with AMReX `development` and your recent
+commits have been saved in `new_branch` branch.
+
+If for some reason your PR branch has diverged from AMReX, you can try to fix it as follows.  Before
+you try it, you should back up your code in case things go wrong.
+```
+git fetch upstream  # assuming upstream is the remote name for the official amrex repo
+git checkout -b xxx upstream/development  # replace xxx with whatever name you like
+git branch -D development
+git checkout -b development upstream/development
+git checkout xxx
+git merge yyy  # here yyy is your PR branch with unclean history
+git rebase -i upstream/development
+```
+You will see something like below in your editor,
+```
+pick 7451d9d commit message a
+pick c4c2459 commit message b
+pick 6fj3g90 commit message c
+```
+This now requires a bit of knowledge of what those commits are: which commits have been merged, and
+which commits are actually new.  However, you should only see your own commits, so it should be
+easy to figure out which commits have already been merged.  Assuming the first two commits have been
+merged, you can drop them by replacing `pick` with `drop`,
+```
+drop 7451d9d commit message a
+drop c4c2459 commit message b
+pick 6fj3g90 commit message c
+```
+After saving and then exiting the editor, `git log` should show a clean history on top of the
+`development` branch.  You can also do `git diff yyy..xxx` to make sure nothing new was dropped.  If
+all goes well, you can submit a PR using `xxx` branch.
+Don't worry: if something goes wrong during the rebase, you can always `git rebase --abort` and start over.
 
 ## Core Developers
 
 People who make a number of substantive contributions will be named
diff --git a/Docs/Doxygen/doxygen.conf b/Docs/Doxygen/doxygen.conf
index 1762f9005d3..93dc968056e 100644
--- a/Docs/Doxygen/doxygen.conf
+++ b/Docs/Doxygen/doxygen.conf
@@ -848,7 +848,7 @@ RECURSIVE = YES
 # Note that relative paths are relative to the directory from which doxygen is
 # run.
 
-EXCLUDE = ../../Src/F_Interfaces ../../Src/AmrTask
+EXCLUDE = ../../Src/F_Interfaces
 
 # The EXCLUDE_SYMLINKS tag can be used to select whether or not files or
 # directories that are symbolic links (a Unix file system feature) are excluded
@@ -1298,7 +1298,7 @@ CHM_FILE =
 HHC_LOCATION =
 
 # The GENERATE_CHI flag controls if a separate .chi index file is generated
-# (YES) or that it should be included in the master .chm file (NO).
+# (YES) or that it should be included in the main .chm file (NO).
 # The default value is: NO.
 # This tag requires that the tag GENERATE_HTMLHELP is set to YES.
 
diff --git a/Docs/Notes/DPCPPWishlist.md b/Docs/Notes/DPCPPWishlist.md
index 0c26f5712e8..fdaf1806a08 100644
--- a/Docs/Notes/DPCPPWishlist.md
+++ b/Docs/Notes/DPCPPWishlist.md
@@ -1,97 +1,120 @@
 # Critical
 
-* Global variables. Could DPC++ support global variables and add
+* [Feature Request] Global variables. Could DPC++ support global variables and add
   something similar to cudaMemcpyToSymbol?
   [oneAPI-spec issue #125](https://github.com/oneapi-src/oneAPI-spec/issues/125)
 
-* Device API for random number generator. Currently we can only use
+* [Feature Request] Device API for random number generator. Currently we can only use
   oneMKL's host API to generate random numbers.
-  [Intel oneAPI Base Toolkit Forum](https://software.intel.com/en-us/forums/intel-oneapi-base-toolkit/topic/856436)
+  [Intel oneAPI Base Toolkit Forum](https://software.intel.com/en-us/forums/intel-oneapi-base-toolkit/topic/856436), [oneAPI-spec issue #139](https://github.com/oneapi-src/oneAPI-spec/issues/139)
 
-* Recursive function call on device. This is very important for ECP
+* [Feature Request] Recursive function call on device. This is very important for ECP
   WarpX code.
   [oneAPI-spec issue #123](https://github.com/oneapi-src/oneAPI-spec/issues/123)
+  A test code is available at https://github.com/WeiqunZhang/dpcpp/tree/main/recursive
 
-* Memory fence. Could DPC++ privode a memory fence function for the
+* [Feature Request] Memory fence. Could DPC++ provide a memory fence function for the
   whole device (not just group)? Or is the CUDA distinction between
   `__threadfence` and `__thread_block` unnecessary for Intel GPUs?
   [oneAPI-spec issue #130](https://github.com/oneapi-src/oneAPI-spec/issues/130)
 
+  This has been partially resolved. SYCL 2020 has introduced `memory_scope::device` ordering.
+
-* The compiler has some troubles with some very big device functions
+* [Bug] The compiler has trouble with some very big device functions
   (e.g., `mlndlap_stencil_rap` in
   `Src/LinearSolvers/MLMG/AMReX_MLNodeLap_3D_K.H`). It hangs at JIT
-  compilation. We have to disable GPU launch for these functions and
-  run them on CPU.
+  compilation. We have to disable GPU launch for these functions and
+  run them on CPU.
+
+  This can be reproduced by the test code at
+  https://github.com/AMReX-Codes/amrex/blob/development/Tests/LinearSolvers/NodeEB/
+
+  ```
+  make -j8 USE_DPCPP=TRUE XTRA_CPPFLAGS=-DAMREX_DPCPP_STENCIL_RAP_ON_GPU
+  ./main3d.dpcpp.TEST.ex inputs.rt.3d.y
+  ```
+
+  If this is compiled without `XTRA_CPPFLAGS=-DAMREX_DPCPP_STENCIL_RAP_ON_GPU`, it runs fine by
+  putting function `mlndlap_stencil_rap` on CPU.
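
As a side note on the memory-fence item above: the `memory_scope::device` ordering that SYCL 2020 introduced can be expressed as in the sketch below. This is our illustrative code, not code from the wishlist, and the kernel body is deliberately trivial:

```
#include <CL/sycl.hpp>

int main ()
{
    sycl::queue q;
    q.parallel_for(sycl::range<1>(64), [=] (sycl::id<1>)
    {
        // Device-wide ordering point (SYCL 2020), roughly analogous to
        // CUDA's __threadfence as discussed above.
        sycl::atomic_fence(sycl::memory_order::acq_rel,
                           sycl::memory_scope::device);
    }).wait();
    return 0;
}
```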
 
 # Major
 
-* The maximum size of kernel parameter is 1KB on current Intel GPUs.
+* [Feature Request] The maximum size of kernel parameter is 1KB on current Intel GPUs.
   This is not sufficient for many of our kernels.
 
-* Sometimes the JIT compilation will raise floating-point exception at
+* [Bug] Sometimes the JIT compilation will raise a floating-point exception at
   runtime. This forces us to disable floating-point exception signal
-  handling that we often rely on for debugging.
+  handling that we often rely on for debugging. A bug reproducer is
+  available at https://github.com/WeiqunZhang/dpcpp/tree/main/jitfpe
 
-* Option to be less OOP. Could we have access to thread id, group id,
+* [Feature Request] Option to be less OOP. Could we have access to thread id, group id,
   memory fence, barrier functions, etc. without using an nd_item like
   object?
   [oneAPI-spec issue #118](https://github.com/oneapi-src/oneAPI-spec/issues/118)
 
-* Local memory. Could DPC++ support static local memory
+* [Feature Request] Local memory. Could DPC++ support static local memory
   (e.g. something like CUDA `__shared__ a[256]`) and dynamic local
   memory (e.g., something like CUDA `extern __shared__ a[]` with the
   amount of memory specified at runtime during kernel launch) from
   anywhere in device code?
   [oneAPI-spec issue #126](https://github.com/oneapi-src/oneAPI-spec/issues/126)
 
+* [Feature Request] DPC++ does not work with ccache.
+  [intel/llvm issue #1797](https://github.com/intel/llvm/issues/1797)
 
-# Minor
-
-* Compiler flag to make implicit capture of this pointer via `[=]` an
-  error. [Implicit capture of this pointer](http://eel.is/c++draft/depr#capture.this)
-  has been deprecated in C++ 20. For many codes, it's almost always a
-  bug when `this` is implicitly captured onto device via `[=]`.
-  [oneAPI-spec issue #127](https://github.com/oneapi-src/oneAPI-spec/issues/127)
+# Minor
 
-* Host callback. Could DPC++ support appending a host callback
+* [Feature Request] Host callback. Could DPC++ support appending a host callback
   function to an ordered queue?
   [oneAPI-spec issue #124](https://github.com/oneapi-src/oneAPI-spec/issues/124)
 
-* Subgroup size. Querying `sycl::info::device::sub_group_size` gives
-  several numbers. For example, we get 8, 16 and 32 for Gen9. We
-  would like to specify the sub group size and this feature is
-  supported. All three sizes seem to work except that subgroup
-  primitives such as `shuffle_down` do not work for all sizes. By try
-  and error, we have found that shuffle_down works for 16. Could
-  oneAPI provide a query function for returning the "primitive"
-  subgroup size?
-  [oneAPI-spec issue #118](https://github.com/oneapi-src/oneAPI-spec/issues/118)
+* [Bug] Subgroup size. Querying `sycl::info::device::sub_group_size` gives several numbers. For
+  example, we get 8, 16 and 32 for Gen9. We would like to specify the sub group size and this
+  feature is supported. All three sizes seem to work except that subgroup primitives such as
+  `shuffle_down` do not work with a size of 32. Could oneAPI provide a query function for returning
+  the "primitive" subgroup size? [oneAPI-spec issue #118](https://github.com/oneapi-src/oneAPI-spec/issues/118)
+  A bug reproducer is available at https://github.com/WeiqunZhang/dpcpp/tree/main/subgroupsize
 
-* `assert(0)`. `assert(0)` when called on device does not throw any
+* [Feature Request] `assert(0)`. `assert(0)` when called on device does not throw any
   errors or abort the run. Is it possible to make it abort or return
   an error code that can be checked on the host?
  In CUDA, the users can check an error code.
   [oneAPI-spec issue #128](https://github.com/oneapi-src/oneAPI-spec/issues/128)
 
-* `sycl::abs`. `sycl::abs(int)` returns an `unsigned int` in contrast to
+* [Defect] `sycl::abs`. `sycl::abs(int)` returns an `unsigned int` in contrast to
   `int std::abs(int)`. Currently `std::abs` does not work on device.
   If `std::abs` is made to work on device, could it return the same
   type as the C++ standard?
   [oneAPI-spec issue #129](https://github.com/oneapi-src/oneAPI-spec/issues/129)
 
+* [Defect] When `dpcpp -M` is used to generate dependencies for make files, the output is saved in a
+  file.  But for most if not all other compilers (including the Intel C/C++ compiler), the output
+  appears on stdout.  If there are no particular reasons for this, could the DPC++ compiler change
+  the behavior to match the other compilers?  It would simplify our make build system.  (This has
+  been reported to Intel via Intel Premier Support.)
+
 # Resolved
 
-* ~~Classes that are not standard layout. The current specification of
+* [Feature Request] Classes that are not standard layout. The current specification of
   oneAPI does not support the capture of objects that are not standard
-  layout. This includes the following example,~~
+  layout. This includes the following example,
 
   ```
   class A {int a;};
   class B {long B;};
   class C : A, B {};
   ```
 
-  ~~AMReX has a data structure called GpuTuple that is built with a
+  AMReX has a data structure called GpuTuple that is built with a
   pattern like the example shown above. It works in CUDA, but not in
-  DPC++. We wish this requirement can be relaxed.~~
+  DPC++. We wish this requirement could be relaxed. This restriction has been relaxed since beta5.
+
+* [Feature Request] Compiler flag to make implicit capture of this pointer via `[=]` an
+  error. [Implicit capture of this pointer](http://eel.is/c++draft/depr#capture.this)
+  has been deprecated in C++ 20. For many codes, it's almost always a
+  bug when `this` is implicitly captured onto device via `[=]`.
+  [oneAPI-spec issue #127](https://github.com/oneapi-src/oneAPI-spec/issues/127)
+
+  This has been implemented in the intel/llvm github repo.
diff --git a/Docs/Notes/Readme.backtrace b/Docs/Notes/Readme.backtrace
deleted file mode 100644
index 478cc5f69cb..00000000000
--- a/Docs/Notes/Readme.backtrace
+++ /dev/null
@@ -1,45 +0,0 @@
-To help debugging, AMReX handles various signals in the C standard
-library raised in the runs.  This gives us a chance to print out more
-information using Linux/Unix backtrace capability.  The signals
-include seg fault, interruption by the user (control-c), assertion
-errors, and floating point exceptions (NaNs, divided by zero and
-overflow).  The handling of seg fault, assertion errors and
-interruption by control-C are enabled by default.  (Note that in C++
-AMReX, AMREX_ASSERT() is only on when compiled with DEBUG=TRUE or
-USE_ASSERTION=TRUE.)  The trapping of floating point exceptions is not
-enabled by default unless the code is compiled with TEST=TRUE or
-DEBUG=TRUE in C++ AMReX, or TEST=t or NDEBUG= in Fortran AMReX.  For
-C++ AMReX codes, one can also use runtime parameters to control the
-handling of floating point exceptions: amrex.fpe_trap_invalid for
-NaNs, amrex.fpe_trap_zero for division by zero and
-amrex.fpe_trap_overflow for overflow.
-To more effectively trap the
-use of uninitialized values, AMReX also initializes MulitFabs and
-arrays allocated by bl_allocate to signaling NaNs when it is compiled
-with TEST=TRUE or DEBUG=TRUE in C++ AMReX, or TEST=t or NDEBUG= in
-Fortran AMReX.  In C++ AMReX, one can also control the setting using
-the runtime parameter, fab.init_snan.
-
-If it is compiled with BACKTRACE=TRUE, one can get more information
-than the backtrace of the call stack by instrumenting the code.  (This
-is in C++ code only.)  Here is an example.  You know the line "Real
-rho = state(cell,0);" is causing a segfault.  You could add a print
-statement before that.  But it might print out thousands (or even
-millions) of line before it hits the segfault.  With BACKTRACE, you
-could do
-
-    #include <AMReX_BLBackTrace.H>
-
-    #ifdef AMREX_BACKTRACING
-        std::ostringstream ss;
-        ss << "state.box() = " << state.box() << " cell = " << cell;
-        BL_BACKTRACE_PUSH(ss.str()); // PUSH takes std::string
-    #endif
-        Real rho = state(cell,0);  // state is a Fab, and cell is an IntVect.
-    #ifdef AMREX_BACKTRACING
-        BL_BACKTRACE_POP(); // One can omit this line.  In that case,
-                            // there is an implicit POP when "PUSH" is
-                            // out of scope.
-    #endif
-
-When it hits the segfault, you will only see the last pint out.
-
diff --git a/Docs/sphinx_documentation/make_api.py b/Docs/sphinx_documentation/make_api.py
index bd3b36da5ec..27362696127 100644
--- a/Docs/sphinx_documentation/make_api.py
+++ b/Docs/sphinx_documentation/make_api.py
@@ -32,8 +32,8 @@ def generate_filelist(rootdir, outfile, output_data, subdir_prefix=""):
             # found a subdirectory - create a new _files.rst file and call
             # generate_filelist on the subdir
 
-            # ignore AmrTask and F_Interfaces
-            if subdir.lower() in ['amrtask', 'f_interfaces']:
+            # ignore F_Interfaces
+            if subdir.lower() in ['f_interfaces']:
                 continue
 
             output_data += """{}_files
diff --git a/Docs/sphinx_documentation/source/AMReX_Profiling_Tools.rst b/Docs/sphinx_documentation/source/AMReX_Profiling_Tools.rst
index 1e0c9cdf618..a61ce2464c4 100644
--- a/Docs/sphinx_documentation/source/AMReX_Profiling_Tools.rst
+++ b/Docs/sphinx_documentation/source/AMReX_Profiling_Tools.rst
@@ -26,10 +26,10 @@ in your GNUMakefile. If using cmake then set the following cmake flags
 
 ::
 
-    AMREX_ENABLE_TINY_PROFILE = ON
-    AMREX_ENABLE_BASE_PROFILE = OFF
+    AMReX_TINY_PROFILE = ON
+    AMReX_BASE_PROFILE = OFF
 
-Note that if you set ``PROFILE = TRUE`` (or ``AMREX_ENABLE_BASE_PROFILE =
+Note that if you set ``PROFILE = TRUE`` (or ``AMReX_BASE_PROFILE =
 ON``) then this will override the ``TINY_PROFILE`` flag and tiny profiling
 will be disabled.
 
@@ -245,4 +245,3 @@ parser itself. It has been integrated into Amrvis for visual interpretation
 of the data allowing Amrvis to open the bl_prof database like a plotfile but
 with interfaces appropriate to profiling data. AMRProfParser and Amrvis can
 be run in parallel both interactively and in batch mode.
-
diff --git a/Docs/sphinx_documentation/source/AmrCore.rst b/Docs/sphinx_documentation/source/AmrCore.rst
index 8bcd30e750e..53326901262 100644
--- a/Docs/sphinx_documentation/source/AmrCore.rst
+++ b/Docs/sphinx_documentation/source/AmrCore.rst
@@ -41,7 +41,7 @@ AmrCore Source Code: Details
 ============================
 
-Here we provide more information about the source code in ``amrex/Src/AmrCore.``
+Here we provide more information about the source code in ``amrex/Src/AmrCore``.
 
 AmrMesh and AmrCore
 -------------------
@@ -219,7 +219,7 @@ of using :cpp:`MultiFab::FillBoundary` and :cpp:`FillDomainBoundary()`.
 A :cpp:`FillPatchUtil` uses an :cpp:`Interpolater`. This is largely hidden
 from application codes. AMReX_Interpolater.cpp/H contains the virtual base
 class :cpp:`Interpolater`, which provides an interface for coarse-to-fine
 spatial interpolation operators. The fillpatch routines described
-above require an Interpolater for FillPatchTwoLevels()
+above require an Interpolater for FillPatchTwoLevels().
 
 Within AMReX_Interpolater.cpp/H are the derived classes:
 
 - :cpp:`NodeBilinear`
@@ -449,7 +449,7 @@ Here is a high-level pseudo-code of the flow of the program:
          AmrCoreAdv::MakeNewLevelFromScratch()
             /* allocate phi_old, phi_new, t_new, and flux registers */
             initdata()  // fill phi
-   } (while (finest_level < max_level);
+   } while (finest_level < max_level);
    }
    amr_core_adv.Evolve()
       loop over time steps {
diff --git a/Docs/sphinx_documentation/source/AmrLevel.rst b/Docs/sphinx_documentation/source/AmrLevel.rst
index 85dbcbf4404..de4180d25e3 100644
--- a/Docs/sphinx_documentation/source/AmrLevel.rst
+++ b/Docs/sphinx_documentation/source/AmrLevel.rst
@@ -125,7 +125,7 @@ cells, number of components, and the interlevel interpolation
 (See AMReX_Interpolater for various interpolation types. We also see how to
 specify physical boundary functions by providing a function (in this case,
 :cpp:`nullfill` since we are not using physical boundary conditions), where
-:cpp:`nullfill` is defined in a fortran routine in the tutorial source code.
+:cpp:`nullfill` is defined in a Fortran routine in the tutorial source code.
 
 Example: Advection_AmrLevel
 ===========================
diff --git a/Docs/sphinx_documentation/source/AsyncIter.rst b/Docs/sphinx_documentation/source/AsyncIter.rst
deleted file mode 100644
index 3742d629088..00000000000
--- a/Docs/sphinx_documentation/source/AsyncIter.rst
+++ /dev/null
@@ -1,95 +0,0 @@
-FillPatch Iterator
-==================
-
-FillPatch is an important operation commonly used in AMReX applications.
-This operation interpolates data in both space and time.
-Communication between AMR levels may incur when FillPatch interpolates data from a coarse AMR level and stores the result on the next finer level.
-This operation also results in communication within the same AMR level when the subcycling option is used, which requires data interpolation in time.
-
-We develop an asynchronous version of the FillPatch operation, called Asynchronous FillPatch Iterator.
-Each iterator takes care of the communication with the previous and next subcycles at the same AMR level (time) and between the current and the next finer AMR levels (space and time).
-The iterator first automatically prepares temporary data needed for these communication activities and the data connections (aka data paths or data dependencies) among them.
-
-Based on this setup, the programmer can design numerical solvers.
-This work is fairly simple.
-At a certain simulation time on an AMR level, the programmer can ask the runtime system which FABs have received sufficient data for advancing to the next time step.
-Although the FillPatch operation can be handled independently by the communication handler of the runtime system, this operation requires some computations such as packing/unpacking and extrapolation.
-The programmer has the freedom to dedicate a few threads from the pool of worker threads to parallelize those computations.
-This design choice may help the runtime process FillPatch operations faster, but may slow down the main computation.
-Thus, our advise to the programmer on using how many threads for the FillPatch is that it depends on the compute intensity of the actual workload.
-If the simulation is memory-bandwidth or network-bandwidth bound, the programmer can get the benefit from sparing more threads for doing FillPatch.
-
-RegionGraph Iterator
-====================
-
-We can simplify the programming work further with a new abstraction called RegionGraph Iterator a.k.a RGIter.
-This abstraction is a for loop (see the following code snippet), which can hide details of the asynchronous FillPatch Iterator in the init part and the graph traversal in the ++ operator.
-The only job required from the programmer is to specify the computations on the data, and they can easily place these computations in the loop body.
-
-.. highlight:: c++
-
-::
-
-    for (RGIter rgi(afpi_vec, upper_afpi_vec, ...); rgi.isValid(); ++rgi){
-        int f = rgi.currentRegion;
-        ...//computation on FAB f
-    }
-
-The execution of RGIter is as follows.
-Initially, an object of RGIter (i.e. rgi) is instantiated, taking vectors of FillPatch Iterators on the current and upper AMR levels as arguments (each element of the vector corresponds to a specific time).
-Based on these arguments, a task dependency graph spanning two AMR levels will be established.
-Next, isValid() asks the runtime system for FABs that have received all dependent data.
-When there is such a FAB, the computations in the loop body can execute on the FAB's data.
-When the computations on a FAB finish, the ++ operator is called.
-We overload this operator to traverse to the next runnable FAB.
-
-Note: RGIter also supports data tiling.
-Specifically, we overload the ++ operator so that it will traverse data tiles in a FAB before it goes to next FAB if the tiling flag in the FAB is enabled.
-Instead of applying the computations in the loop body on the entire FAB, it executes them on a single tile at a time.
-
-
-Generated Task Graph Code
-=========================
-
-The real input to the runtime system is an AMR program containing task dependency graphs (or task graph for short).
-Thus, the code written with the above asynchronous iterators will be transformed into a task graph form.
-The definition of a task dependency graph is as follows.
-Each task of a graph performs some computations on an FArrayBox (FAB).
-Tasks are connected with each other via edges, denoting the dependency on data.
-A task can be executed when all data dependencies have been satisfied.
-The code snippet below queries runnable tasks of a task dependency graph named regionGraph.
-Note that each task dependency graph is more or less a wrapper of a MultiFab.
-In this example, a task of regionGraph computes the body code of the while loop to update the associated FAB.
-Each task of this graph receives data arrived at the runtime system and injects the data into the associated FAB.
-After updating FAB, it lets the runtime know about the change.
-The runtime system uses AMR domain knowledge to establish data dependencies among tasks, and thus it can answer which tasks are runnable and how to update neighbor FABs when a current FAB changes.
-
-.. highlight:: c++
-
-::
-
-    while(!regionGraph->isGraphEmpty())
-    {
-        f = regionGraph->getAnyFireableRegion();
-        multifabCopyPull(..., f, ...); //inject arrived dependent data into the fab, if any
-        syncWorkerThreads();
-        ...//compute on the fab f of multifab associated with coarseRegionGraph
-        syncWorkerThreads();
-        multifabCopyPush(..., f, ...); //tell the runtime that data of Fab f changed
-        regionGraph->finalizeRegion(f)
-    }
-
-The process of learning the domain knowledge is as follows.
-At the beginning of the program, the runtime extracts the metadata needed for establishing data dependencies among tasks of the same graph or between two different graphs.
-Every time the AMR grid hierarchy changes (i.e. when a few or all AMR levels regrid), the runtime re-extracts the metadata to correct the task dependency graphs.
-Once the metadata extraction completes, the runtime system invokes the computation on AMR levels (e.g., timeStep, initTimeStep, and postTimeStep).
-
-Known Limitations
-=================
-
-To realize enough task parallelism, the runtime system constructs a task dependency graph for the whole coarse time step and executes it asynchronously to the completion of the step.
-As a result, any request to regrid an AMR level must be foreseen before the execution of a coarse time step.
-If there is a regridding request during the graph execution, the runtime system simply ignores it.
-In the future we may relax this constraint in the programming model.
-However, such a support would come at a significant performance cost due to the required checkpointing and rollback activities.
-
diff --git a/Docs/sphinx_documentation/source/AsyncIter_Chapter.rst b/Docs/sphinx_documentation/source/AsyncIter_Chapter.rst
deleted file mode 100644
index 446709442ef..00000000000
--- a/Docs/sphinx_documentation/source/AsyncIter_Chapter.rst
+++ /dev/null
@@ -1,49 +0,0 @@
-.. _Chap:AsyncIter:
-
-Asynchronous Iterators (AmrTask)
-================================
-
-Hiding communication overheads via overlapping communication with computation requires a sufficiently large amount of task parallelism.
-This problem is even more challenging due to various types of tasks in an AMReX program, including data parallel tasks (same workload on different data partitions) and control parallel tasks (different types of workload).
-This chapter introduces the API of AMReX's asynchronous iterators that can facilitate the job of identifying tasks in the applications.
-We have developed two iterators called FillPatch and RegionGraph Iterators, which will be described later on in this chapter.
-We first show how the programmer can use a runtime system to execute application codes written with these iterators.
-
-In ``amrex/Src/AmrTask/rts_impls``, we implement RTS - a runtime system that can execute asynchronous AMReX applications efficiently on large-scale systems.
-RTS is a black box to the application developer as showed in the following code snippet, which is the main function of a typical AMReX application running asynchronously under the control of the runtime system.
-The programmer first needs to use the namespace ``perilla``, which covers all the C++ classes for the runtime system.
-To execute an AMR program (i.e. object of the Amr class), the programmer can simply create an object of RTS and pass the program object into the ``Iterate`` method.
-The runtime system will iteratively execute coarse time steps until the program completes.
-By default RTS links to MPI and Pthreads libraries.
-The programmer can also switch to other backends such as UPCXX (1-sided communication model compared to the common 2-sided model in MPI) without changing the application source code.
-
-.. highlight:: c++
-
-::
-
-    using namespace perilla;
-    int main (int argc, char* argv[])
-    {
-        amrex::Initialize(argc,argv);
-        ... //set up program input, e.g. start_time, stop_time, max_step
-        Amr amr;
-        amr.init(start_time,stop_time);
-        RTS rts;
-        rts.Iterate(&amr, max_step, stop_time);
-        amrex::Finalize();
-        return 0;
-    }
-
-In a few functions of the Amr class, the runtime exposes multiple threads per process.
-As a result, the programmer needs to place sufficient memory protection for shared data within the process, e.g. when updating the state data.  This multithreaded interface adds some programming cost, but is necessary for mitigating the task scheduling overhead.
-To avoid these programming details, the programmer can use built-in iterators, such as fillpatch iterator and task graph iterator that we next discuss.
-The API of these iterators is very simple, and the asynchronous code is very similar to the original code using the synchronous multifab iterator (MFIter) described earlier in chapter Basics.
-
-
-.. toctree::
-   :maxdepth: 1
-
-   AsyncIter
-
-
diff --git a/Docs/sphinx_documentation/source/Basics.rst b/Docs/sphinx_documentation/source/Basics.rst
index 15ace124b35..c1c8a30a9fc 100644
--- a/Docs/sphinx_documentation/source/Basics.rst
+++ b/Docs/sphinx_documentation/source/Basics.rst
@@ -38,7 +38,7 @@ It is used throughout AMReX, however its functions are not defined for
 device code. :cpp:`GpuArray` is AMReX's built-in alternative. It is a
 trivial type that works on both host and device. It also works when
 compiled just for CPU. Besides :cpp:`GpuArray`, AMReX also
-provides GPU safe :cpp:`Array1D`, :cpp:`Array2D` and :cpp:`Array3d` that are
+provides GPU safe :cpp:`Array1D`, :cpp:`Array2D` and :cpp:`Array3D` that are
 1, 2 and 3-dimensional fixed size arrays, respectively. These three class
 templates can have non-zero based indexing.
 
@@ -279,6 +279,34 @@ run with
 
 to change the value of :cpp:`ncells` and :cpp:`hydro.cfl`.
 
+Sometimes an application code may want to set a default that differs from the
+default in AMReX. In this case, it is often convenient to define a function that
+sets the variable(s), and pass the name of that function to :cpp:`amrex::Initialize`.
+As an example, we may define :cpp:`add_par` to set :cpp:`extend_domain_face`
+to false if it hasn't already been set in the inputs file.
+
+.. highlight:: c++
+
+::
+
+    void add_par () {
+        ParmParse pp("eb2");
+        if (not pp.contains("extend_domain_face")) {
+            pp.add("extend_domain_face", false);
+        }
+    }
+
+Then we would pass :cpp:`add_par` into :cpp:`amrex::Initialize`:
+
+.. highlight:: c++
+
+::
+
+    amrex::Initialize(argc, argv, true, MPI_COMM_WORLD, add_par);
+
+This value replaces the current default value of true in AMReX itself, but
+can still be overwritten by setting a value in the inputs file.
+
 
 .. _sec:basics:initialize:
 
@@ -347,7 +375,7 @@ arguments.
 
     main2d*.exe inputs amrex.v=1 amrex.fpe_trap_invalid=1 -- -tao_monitor
 
 then AMReX will parse the inputs file and the optional AMReX's command
-line arguments, but will ignore everything after "--".
+line arguments, but will ignore everything after the double dashes.
 
 .. _sec:basics:amrgrids:
 
@@ -624,8 +652,8 @@ the index type. Some examples are shown below.
Print() << facebx.coarsen(2); // ((16,16,16) (32,31,31) (1,0,0)) Box uncoarsenable ({16,16,16}, {30,30,30}); - print() << uncoarsenable.coarsen(2); // ({8,8,8}, {15,15,15}); - print() << uncoarsenable.refine(2); // ({16,16,16}, {31,31,31}); + Print() << uncoarsenable.coarsen(2); // ((8,8,8), (15,15,15)); + Print() << uncoarsenable.refine(2); // ((16,16,16), (31,31,31)); // Different from the original! Note that the behavior of refinement and coarsening depends on the @@ -1259,7 +1287,7 @@ will be :cpp:`Box{(6,6,6) (16,16,16)}` in this example. For cells in :cpp:`FArrayBox`, we call those in the original :cpp:`Box` **valid cells** and the grown part **ghost cells**. Note that :cpp:`FArrayBox` itself does not have the concept of ghost cells. Ghost cells are a key concept of -:cpp:`MultiFab`,however, that allows for local operations on ghost cell data +:cpp:`MultiFab`, however, that allows for local operations on ghost cell data originating from remote processes. We will discuss how to fill ghost cells with data from valid cells later in this section. :cpp:`MultiFab` also has a default constructor. One can define an empty :cpp:`MultiFab` first and then @@ -1335,7 +1363,7 @@ face averaged variables. MultiFab zflux(amrex::convert(ba, IntVect{0,0,1}), dm, ncomp, 0); Here all :cpp:`MultiFab`\ s use the same :cpp:`DistributionMapping`, but their -:cpp:`BoxArrays` have different index types. The state is cell-based, whereas +:cpp:`BoxArray`\ s have different index types. The state is cell-based, whereas the fluxes are on the faces. Suppose the cell based :cpp:`BoxArray` contains a :cpp:`Box{(8,8,16), (15,15,31)}`. The state on that :cpp:`Box` is conceptually a Fortran Array with the dimension of :fortran:`(8:15,8:15,16:31,0:2)`. The @@ -2470,13 +2498,51 @@ Debugging Debugging is an art. Everyone has their own favorite method. Here we offer a few tips we have found to be useful. -Compiling in debug mode (e.g., ``make DEBUG=TRUE``) and running with -``ParmParse`` parameter ``amrex.fpe_trap_invalid=1`` can be helpful. -In debug mode, many compiler debugging flags are turned on and all -``MultiFab`` data are initialized to signaling NaNs. The -``amrex.fpe_trap_invalid`` parameter will result in backtrace files -when floating point exception occurs. One can then examine those -files to track down the origin of the issue. +To help with debugging, AMReX handles various signals of the C standard +library that are raised during runs. This gives us a chance to print out more +information using the Linux/Unix backtrace capability. The signals +include segmentation faults, interruption by the user (control-C), assertion +errors, and floating point exceptions (NaNs, division by zero and +overflow). The handling of segmentation faults, assertion errors and +interruption by control-C is enabled by default. Note that +``AMREX_ASSERT()`` is only on when compiled with ``DEBUG=TRUE`` or +``USE_ASSERTION=TRUE`` in GNU make, or with ``-DCMAKE_BUILD_TYPE=Debug`` or +``-DAMReX_ASSERTIONS=YES`` in CMake. The trapping of floating point exceptions is not +enabled by default unless the code is compiled with ``DEBUG=TRUE`` in GNU make, or with +``-DCMAKE_BUILD_TYPE=Debug`` or ``-DAMReX_FPE=YES`` in CMake to turn on compiler flags +if supported. Alternatively, one can always use runtime parameters to control the +handling of floating point exceptions: ``amrex.fpe_trap_invalid`` for +NaNs, ``amrex.fpe_trap_zero`` for division by zero and +``amrex.fpe_trap_overflow`` for overflow.
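+For example, assuming a hypothetical executable named ``main3d.gnu.ex`` with an
+inputs file ``inputs`` (any AMReX application works the same way, since these
+are ordinary ``ParmParse`` parameters), all three traps can be turned on at
+run time without recompiling:
+
+.. highlight:: console
+
+::
+
+   ./main3d.gnu.ex inputs amrex.fpe_trap_invalid=1 amrex.fpe_trap_zero=1 amrex.fpe_trap_overflow=1
+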
+To more effectively trap the use of uninitialized values, AMReX also initializes ``FArrayBox``\ s in +``MultiFab``\ s and arrays allocated by ``bl_allocate`` to signaling NaNs when it is compiled +with ``TEST=TRUE`` or ``DEBUG=TRUE`` in GNU make, or with ``-DCMAKE_BUILD_TYPE=Debug`` in CMake. +One can also control the setting for ``FArrayBox`` using the runtime parameter ``fab.init_snan``. + +One can get more information than the backtrace of the call stack by +instrumenting the code. Here is an example. +Suppose you know the line ``Real rho = state(cell,0);`` is causing a segfault. You +could add a print statement before that. But it might print out +thousands (or even millions) of lines before it hits the segfault. What +you could do is the following: + +.. highlight:: c++ + +:: + + #include <sstream> + + std::ostringstream ss; + ss << "state.box() = " << state.box() << " cell = " << cell; + BL_BACKTRACE_PUSH(ss.str()); // PUSH takes std::string + + Real rho = state(cell,0); // state is a Fab, and cell is an IntVect. + + BL_BACKTRACE_POP(); // One can omit this line. In that case, + // there is an implicit POP when "PUSH" is + // out of scope. + +When it hits the segfault, you will only see the last print out. Writing a ``MultiFab`` to disk with @@ -2601,7 +2667,7 @@ domain, the physical coordinates of the box, and the periodicity: IntVect dom_hi(AMREX_D_DECL(n_cell-1, n_cell-1, n_cell-1)); Box domain(dom_lo, dom_hi); - // Initialize the boxarray "ba" from the single box "bx" + // Initialize the boxarray "ba" from the single box "domain" ba.define(domain); // Break up boxarray "ba" into chunks no larger than "max_grid_size" along a direction ba.maxSize(max_grid_size); @@ -2650,7 +2716,7 @@ We demonstrate how to build an array of face-based ``MultiFabs`` : flux[dir].define(edge_ba, dm, 1, 0); } -To access and/or modify data n a ``MultiFab`` we use the ``MFIter``, where each +To access and/or modify data in a ``MultiFab`` we use the ``MFIter``, where each processor loops over grids it owns to access and/or modify data on that grid: :: diff --git a/Docs/sphinx_documentation/source/BuildingAMReX.rst b/Docs/sphinx_documentation/source/BuildingAMReX.rst index 32b9da1a48c..8731d2fbef8 100644 --- a/Docs/sphinx_documentation/source/BuildingAMReX.rst +++ b/Docs/sphinx_documentation/source/BuildingAMReX.rst @@ -28,34 +28,40 @@ list of important variables.
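+For reference, a typical invocation might combine several of the variables
+listed in the table below; a hypothetical example (the ``-j8`` parallelism is
+illustrative) would be:
+
+.. highlight:: console
+
+::
+
+   make -j8 COMP=gnu DIM=3 USE_MPI=TRUE DEBUG=FALSE
+
..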
table:: Important make variables - +------------+-------------------------------------+--------------------+ - | Variable | Value | Default | - +============+=====================================+====================+ - | AMREX_HOME | Path to amrex | environment | - +------------+-------------------------------------+--------------------+ - | COMP | gnu, cray, ibm, intel, llvm, or pgi | none | - +------------+-------------------------------------+--------------------+ - | CXXSTD | C++ standard (``c++11``, ``c++14``) | compiler default, | - | | | at least ``c++11`` | - +------------+-------------------------------------+--------------------+ - | DEBUG | TRUE or FALSE | FALSE | - +------------+-------------------------------------+--------------------+ - | DIM | 1 or 2 or 3 | 3 | - +------------+-------------------------------------+--------------------+ - | PRECISION | DOUBLE or FLOAT | DOUBLE | - +------------+-------------------------------------+--------------------+ - | USE_MPI | TRUE or FALSE | FALSE | - +------------+-------------------------------------+--------------------+ - | USE_OMP | TRUE or FALSE | FALSE | - +------------+-------------------------------------+--------------------+ - | USE_CUDA | TRUE or FALSE | FALSE | - +------------+-------------------------------------+--------------------+ - | USE_HIP | TRUE or FALSE | FALSE | - +------------+-------------------------------------+--------------------+ - | USE_DPC++ | TRUE or FALSE | FALSE | - +------------+-------------------------------------+--------------------+ - | USE_RPATH | TRUE or FALSE | FALSE | - +------------+-------------------------------------+--------------------+ + +-----------------+-------------------------------------+--------------------+ + | Variable | Value | Default | + +=================+=====================================+====================+ + | AMREX_HOME | Path to amrex | environment | + +-----------------+-------------------------------------+--------------------+ + | COMP | gnu, cray, ibm, intel, llvm, or pgi | none | + +-----------------+-------------------------------------+--------------------+ + | CXXSTD | C++ standard (``c++11``, ``c++14``, | compiler default, | + | | ``c++17``, ``c++20``) | at least ``c++11`` | + +-----------------+-------------------------------------+--------------------+ + | DEBUG | TRUE or FALSE | FALSE | + +-----------------+-------------------------------------+--------------------+ + | DIM | 1 or 2 or 3 | 3 | + +-----------------+-------------------------------------+--------------------+ + | PRECISION | DOUBLE or FLOAT | DOUBLE | + +-----------------+-------------------------------------+--------------------+ + | USE_MPI | TRUE or FALSE | FALSE | + +-----------------+-------------------------------------+--------------------+ + | USE_OMP | TRUE or FALSE | FALSE | + +-----------------+-------------------------------------+--------------------+ + | USE_CUDA | TRUE or FALSE | FALSE | + +-----------------+-------------------------------------+--------------------+ + | USE_HIP | TRUE or FALSE | FALSE | + +-----------------+-------------------------------------+--------------------+ + | USE_DPCPP | TRUE or FALSE | FALSE | + +-----------------+-------------------------------------+--------------------+ + | USE_RPATH | TRUE or FALSE | FALSE | + +-----------------+-------------------------------------+--------------------+ + | WARN_ALL | TRUE or FALSE | TRUE for DEBUG | + | | | FALSE otherwise | + 
+-----------------+-------------------------------------+--------------------+ + | AMREX_CUDA_ARCH | CUDA arch such as 70 | 70 if not set | + | or CUDA_ARCH | | or detected | +-----------------+-------------------------------------+--------------------+ .. raw:: latex \end{center} @@ -92,12 +98,15 @@ One could set the ``DIM`` variable to either 1, 2, or 3, depending on the dimensionality of the problem. The default dimensionality is 3. AMReX uses double precision by default. One can change to single precision by setting ``PRECISION=FLOAT``. +(Particles have an equivalent flag ``USE_SINGLE_PRECISION_PARTICLES=TRUE/FALSE``.) Variables ``DEBUG``, ``USE_MPI`` and ``USE_OMP`` are optional with default set to FALSE. The meaning of these variables should be obvious. When ``DEBUG=TRUE``, aggressive compiler optimization flags are turned off and assertions in source code are turned on. For production runs, ``DEBUG`` should be set to FALSE. +An advanced variable, ``MPI_THREAD_MULTIPLE``, can be set to TRUE to initialize +MPI with support for concurrent MPI calls from multiple threads. Variables ``USE_CUDA``, ``USE_HIP`` and ``USE_DPCPP`` are used for targeting Nvidia, AMD and Intel GPUs, respectively. At most one of @@ -109,6 +118,16 @@ If enabled, the library path at link time will be saved as a When disabled, dynamic library paths could be provided via ``export LD_LIBRARY_PATH`` hints at runtime. +For GCC and Clang, the variable ``WARN_ALL`` controls the compiler's warning options. There is +also a make variable ``WARN_ERROR`` (with default of ``FALSE``) to turn warnings into errors. + +When ``USE_CUDA`` is ``TRUE``, the make system will try to detect what CUDA +arch should be used by running +``$(CUDA_HOME)/extras/demo_suite/deviceQuery`` if it does not recognize your machine. +If it fails to detect the CUDA arch, the default value of 70 will be used. +The user could override it by ``make USE_CUDA=TRUE CUDA_ARCH=80`` or ``make +USE_CUDA=TRUE AMREX_CUDA_ARCH=80``. + After defining these make variables, a number of files, ``Make.defs``, ``Make.package`` and ``Make.rules``, are included in the GNUmakefile. AMReX-based applications do not need to include all directories in AMReX; an application @@ -373,15 +392,14 @@ For example, one can enable OpenMP support as follows: :: - cmake -DENABLE_OMP=YES -DCMAKE_INSTALL_PREFIX=/path/to/installdir /path/to/amrex + cmake -DAMReX_OMP=YES -DCMAKE_INSTALL_PREFIX=/path/to/installdir /path/to/amrex -In the example above ``<option>=ENABLE_OMP`` and ``<value>=YES``. +In the example above ``<option>=AMReX_OMP`` and ``<value>=YES``. Configuration variables requiring a boolean value are evaluated to true if they are assigned a value of ``1``, ``ON``, ``YES``, ``TRUE``, ``Y``. Conversely they are evaluated to false if they are assigned a value of ``0``, ``OFF``, ``NO``, ``FALSE``, ``N``. Boolean configuration variables are case-insensitive. -The list of available options is reported in the table on :ref:`tab:cmakevar` -below. +The list of available options is reported in the :ref:`table <tab:cmakevar>` below. .. raw:: latex @@ -390,95 +408,95 @@ below. -..
table:: AMReX build options - - +------------------------------+-------------------------------------------------+-------------+-----------------+ - | Variable Name | Description | Default | Possible values | - +==============================+=================================================+=============+=================+ - | CMAKE_Fortran_COMPILER | User-defined Fortran compiler | | user-defined | - +------------------------------+-------------------------------------------------+-------------+-----------------+ - | CMAKE_CXX_COMPILER | User-defined C++ compiler | | user-defined | - +------------------------------+-------------------------------------------------+-------------+-----------------+ - | CMAKE_Fortran_FLAGS | User-defined Fortran flags | | user-defined | - +------------------------------+-------------------------------------------------+-------------+-----------------+ - | CMAKE_CXX_FLAGS | User-defined C++ flags | | user-defined | - +------------------------------+-------------------------------------------------+-------------+-----------------+ - | CMAKE_CXX_STANDARD | C++ standard | compiler/11 | 11, 14, 17, 20 | - +------------------------------+-------------------------------------------------+-------------+-----------------+ - | DIM | Dimension of AMReX build | 3 | 1, 2, 3 | - +------------------------------+-------------------------------------------------+-------------+-----------------+ - | USE_XSDK_DEFAULTS | Use XSDK defaults settings | NO | YES, NO | - +------------------------------+-------------------------------------------------+-------------+-----------------+ - | ENABLE_FORTRAN | Enable Fortran language | YES | YES, NO | - +------------------------------+-------------------------------------------------+-------------+-----------------+ - | ENABLE_DP | Build with double-precision reals | YES | YES, NO | - +------------------------------+-------------------------------------------------+-------------+-----------------+ - | ENABLE_PIC | Build Position Independent Code | NO | YES, NO | - +------------------------------+-------------------------------------------------+-------------+-----------------+ - | ENABLE_MPI | Build with MPI support | YES | YES, NO | - +------------------------------+-------------------------------------------------+-------------+-----------------+ - | ENABLE_OMP | Build with OpenMP support | NO | YES, NO | - +------------------------------+-------------------------------------------------+-------------+-----------------+ - | ENABLE_CUDA | Build with CUDA support | NO | YES, NO | - +------------------------------+-------------------------------------------------+-------------+-----------------+ - | CUDA_ARCH | CUDA target architecture | Auto | User-defined | - +------------------------------+-------------------------------------------------+-------------+-----------------+ - | CUDA_MAX_THREADS | Max number of CUDA threads per block | 256 | User-defined | - +------------------------------+-------------------------------------------------+-------------+-----------------+ - | CUDA_MAXREGCOUNT | Limits the number of CUDA registers available | 255 | User-defined | - +------------------------------+-------------------------------------------------+-------------+-----------------+ - | ENABLE_CUDA_FASTMATH | Enable CUDA fastmath library | YES | YES, NO | - +------------------------------+-------------------------------------------------+-------------+-----------------+ - | ENABLE_FORTRAN_INTERFACES | Build Fortran API | NO | YES, NO | - 
+------------------------------+-------------------------------------------------+-------------+-----------------+ - | ENABLE_LINEAR_SOLVERS | Build AMReX linear solvers | YES | YES, NO | - +------------------------------+-------------------------------------------------+-------------+-----------------+ - | ENABLE_AMRDATA | Build data services | NO | YES, NO | - +------------------------------+-------------------------------------------------+-------------+-----------------+ - | ENABLE_EB | Build Embedded Boundary support | NO | YES, NO | - +------------------------------+-------------------------------------------------+-------------+-----------------+ - | ENABLE_PARTICLES | Build particle classes | NO | YES, NO | - +------------------------------+-------------------------------------------------+-------------+-----------------+ - | ENABLE_DP_PARTICLES | Use double-precision reals in particle classes | YES | YES, NO | - +------------------------------+-------------------------------------------------+-------------+-----------------+ - | ENABLE_BASE_PROFILE | Build with basic profiling support | NO | YES, NO | - +------------------------------+-------------------------------------------------+-------------+-----------------+ - | ENABLE_TINY_PROFILE | Build with tiny profiling support | NO | YES, NO | - +------------------------------+-------------------------------------------------+-------------+-----------------+ - | ENABLE_TRACE_PROFILE | Build with trace-profiling support | NO | YES, NO | - +------------------------------+-------------------------------------------------+-------------+-----------------+ - | ENABLE_COMM_PROFILE | Build with comm-profiling support | NO | YES, NO | - +------------------------------+-------------------------------------------------+-------------+-----------------+ - | ENABLE_MEM_PROFILE | Build with memory-profiling support | NO | YES, NO | - +------------------------------+-------------------------------------------------+-------------+-----------------+ - | ENABLE_PROFPARSER | Build with profile parser support | NO | YES, NO | - +------------------------------+-------------------------------------------------+-------------+-----------------+ - | ENABLE_BACKTRACE | Build with backtrace support | NO | YES, NO | - +------------------------------+-------------------------------------------------+-------------+-----------------+ - | ENABLE_FPE | Build with Floating Point Exceptions checks | NO | YES, NO | - +------------------------------+-------------------------------------------------+-------------+-----------------+ - | ENABLE_ASSERTIONS | Build with assertions turned on | NO | YES, NO | - +------------------------------+-------------------------------------------------+-------------+-----------------+ - | ENABLE_SUNDIALS | Enable SUNDIALS 4 interfaces | NO | YES, NO | - +------------------------------+-------------------------------------------------+-------------+-----------------+ - | ENABLE_SENSEI_IN_SITU | Enable SENSEI_IN_SITU infrastucture | NO | YES, NO | - +------------------------------+-------------------------------------------------+-------------+-----------------+ - | ENABLE_CONDUIT | Enable Conduit support | NO | YES, NO | - +------------------------------+-------------------------------------------------+-------------+-----------------+ - | ENABLE_ASCENT | Enable Ascent support | NO | YES, NO | - +------------------------------+-------------------------------------------------+-------------+-----------------+ - | ENABLE_HYPRE | Enable 
HYPRE interfaces | NO | YES, NO | - +------------------------------+-------------------------------------------------+-------------+-----------------+ - | ENABLE_PLOTFILE_TOOLS | Build and install plotfile postprocessing tools| NO | YES, NO | - +------------------------------+-------------------------------------------------+-------------+-----------------+ - | ENABLE_TUTORIALS | Build tutorials | NO | YES, NO | - +------------------------------+-------------------------------------------------+-------------+-----------------+ +.. table:: AMReX build options (refer to section :ref:`sec:gpu:build` for GPU-related options). + + +------------------------------+-------------------------------------------------+-------------------------+-----------------------+ + | Variable Name | Description | Default | Possible values | + +==============================+=================================================+=========================+=======================+ + | CMAKE_Fortran_COMPILER | User-defined Fortran compiler | | user-defined | + +------------------------------+-------------------------------------------------+-------------------------+-----------------------+ + | CMAKE_CXX_COMPILER | User-defined C++ compiler | | user-defined | + +------------------------------+-------------------------------------------------+-------------------------+-----------------------+ + | CMAKE_Fortran_FLAGS | User-defined Fortran flags | | user-defined | + +------------------------------+-------------------------------------------------+-------------------------+-----------------------+ + | CMAKE_CXX_FLAGS | User-defined C++ flags | | user-defined | + +------------------------------+-------------------------------------------------+-------------------------+-----------------------+ + | CMAKE_CXX_STANDARD | C++ standard | compiler/11 | 11, 14, 17, 20 | + +------------------------------+-------------------------------------------------+-------------------------+-----------------------+ + | AMReX_SPACEDIM | Dimension of AMReX build | 3 | 1, 2, 3 | + +------------------------------+-------------------------------------------------+-------------------------+-----------------------+ + | USE_XSDK_DEFAULTS | Use XSDK defaults settings | NO | YES, NO | + +------------------------------+-------------------------------------------------+-------------------------+-----------------------+ + | AMReX_FORTRAN | Enable Fortran language | YES | YES, NO | + +------------------------------+-------------------------------------------------+-------------------------+-----------------------+ + | AMReX_PRECISION | Set the precision of reals | DOUBLE | DOUBLE, SINGLE | + +------------------------------+-------------------------------------------------+-------------------------+-----------------------+ + | AMReX_PIC | Build Position Independent Code | NO | YES, NO | + +------------------------------+-------------------------------------------------+-------------------------+-----------------------+ + | AMReX_MPI | Build with MPI support | YES | YES, NO | + +------------------------------+-------------------------------------------------+-------------------------+-----------------------+ + | AMReX_OMP | Build with OpenMP support | NO | YES, NO | + +------------------------------+-------------------------------------------------+-------------------------+-----------------------+ + | AMReX_GPU_BACKEND | Build with on-node, accelerated GPU backend | NONE | NONE, SYCL, HIP, CUDA | + 
+------------------------------+-------------------------------------------------+-------------------------+-----------------------+ + | AMReX_FORTRAN_INTERFACES | Build Fortran API | NO | YES, NO | +------------------------------+-------------------------------------------------+-------------------------+-----------------------+ + | AMReX_LINEAR_SOLVERS | Build AMReX linear solvers | YES | YES, NO | +------------------------------+-------------------------------------------------+-------------------------+-----------------------+ + | AMReX_AMRDATA | Build data services | NO | YES, NO | +------------------------------+-------------------------------------------------+-------------------------+-----------------------+ + | AMReX_EB | Build Embedded Boundary support | NO | YES, NO | +------------------------------+-------------------------------------------------+-------------------------+-----------------------+ + | AMReX_PARTICLES | Build particle classes | NO | YES, NO | +------------------------------+-------------------------------------------------+-------------------------+-----------------------+ + | AMReX_PARTICLES_PRECISION | Set precision of reals in particle classes | Same as AMReX_PRECISION | DOUBLE, SINGLE | +------------------------------+-------------------------------------------------+-------------------------+-----------------------+ + | AMReX_BASE_PROFILE | Build with basic profiling support | NO | YES, NO | +------------------------------+-------------------------------------------------+-------------------------+-----------------------+ + | AMReX_TINY_PROFILE | Build with tiny profiling support | NO | YES, NO | +------------------------------+-------------------------------------------------+-------------------------+-----------------------+ + | AMReX_TRACE_PROFILE | Build with trace-profiling support | NO | YES, NO | +------------------------------+-------------------------------------------------+-------------------------+-----------------------+ + | AMReX_COMM_PROFILE | Build with comm-profiling support | NO | YES, NO | +------------------------------+-------------------------------------------------+-------------------------+-----------------------+ + | AMReX_MEM_PROFILE | Build with memory-profiling support | NO | YES, NO | +------------------------------+-------------------------------------------------+-------------------------+-----------------------+ + | AMReX_MPI_THREAD_MULTIPLE | Concurrent MPI calls from multiple threads | NO | YES, NO | +------------------------------+-------------------------------------------------+-------------------------+-----------------------+ + | AMReX_PROFPARSER | Build with profile parser support | NO | YES, NO | +------------------------------+-------------------------------------------------+-------------------------+-----------------------+ + | AMReX_FPE | Build with Floating Point Exceptions checks | NO | YES, NO | +------------------------------+-------------------------------------------------+-------------------------+-----------------------+ + | AMReX_ASSERTIONS | Build with assertions turned on | NO | YES, NO | +------------------------------+-------------------------------------------------+-------------------------+-----------------------+ + | AMReX_SUNDIALS | Enable SUNDIALS 4 interfaces | NO | YES, NO | +------------------------------+-------------------------------------------------+-------------------------+-----------------------+ + | AMReX_SENSEI | Enable SENSEI_IN_SITU infrastructure |
NO | YES, NO | +------------------------------+-------------------------------------------------+-------------------------+-----------------------+ + | AMReX_CONDUIT | Enable Conduit support | NO | YES, NO | +------------------------------+-------------------------------------------------+-------------------------+-----------------------+ + | AMReX_ASCENT | Enable Ascent support | NO | YES, NO | +------------------------------+-------------------------------------------------+-------------------------+-----------------------+ + | AMReX_HYPRE | Enable HYPRE interfaces | NO | YES, NO | +------------------------------+-------------------------------------------------+-------------------------+-----------------------+ + | AMReX_PETSC | Enable PETSc interfaces | NO | YES, NO | +------------------------------+-------------------------------------------------+-------------------------+-----------------------+ + | AMReX_HDF5 | Enable HDF5-based I/O | NO | YES, NO | +------------------------------+-------------------------------------------------+-------------------------+-----------------------+ + | AMReX_PLOTFILE_TOOLS | Build and install plotfile postprocessing tools | NO | YES, NO | +------------------------------+-------------------------------------------------+-------------------------+-----------------------+ + | AMReX_BUILD_TUTORIALS | Build tutorials | NO | YES, NO | +------------------------------+-------------------------------------------------+-------------------------+-----------------------+ + | AMReX_ENABLE_TESTS | Enable CTest suite | NO | YES, NO | +------------------------------+-------------------------------------------------+-------------------------+-----------------------+ + | AMReX_DIFFERENT_COMPILER | Allow an app to use a different compiler | NO | YES, NO | +------------------------------+-------------------------------------------------+-------------------------+-----------------------+ .. raw:: latex \end{center} -The option ``CMAKE_BUILD_TYPE=Debug`` implies ``ENABLE_ASSERTION=YES``. In order to turn off -assertions in debug mode, ``ENABLE_ASSERTION=NO`` must be set explicitly while +The option ``CMAKE_BUILD_TYPE=Debug`` implies ``AMReX_ASSERTIONS=YES``. In order to turn off +assertions in debug mode, ``AMReX_ASSERTIONS=NO`` must be set explicitly while invoking CMake. @@ -496,6 +514,36 @@ are defined, AMReX default flags are used. For a detailed explanation of GPU support in AMReX CMake, refer to section :ref:`sec:gpu:build`. +Building Tutorials +------------------ + +In order to build the tutorials provided in ``Tutorials/`` alongside the AMReX library, +follow these steps: + +.. highlight:: console + +:: + + mkdir /path/to/builddir + cd /path/to/builddir + cmake [options] -DAMReX_BUILD_TUTORIALS=YES /path/to/amrex + make + + +Note that only the tutorials compatible with ``[options]`` will be built. +To run one of the tutorials, do: + +.. highlight:: console + +:: + + cd /path/to/builddir/Tutorials/group/name + ./Tutorial_group_name [input_file] + + +``[input_file]`` is any of the input files required by the tutorials and located in +``/path/to/builddir/Tutorials/group/name/``. + CMake and macOS --------------- @@ -562,7 +610,7 @@ In the above snippet, ``<target>`` is any of the targets listed in th The options used to configure the AMReX build may result in certain parts, or ``components``, of the AMReX source code to be excluded from compilation.
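+As a hypothetical sketch (the ``my_app`` target name is made up), a downstream
+``CMakeLists.txt`` can request specific components when locating an installed
+AMReX, using the component names from the table below:
+
+.. highlight:: cmake
+
+::
+
+    # Require a 3D, double-precision AMReX built with MPI support
+    find_package(AMReX REQUIRED COMPONENTS 3D DOUBLE MPI)
+    target_link_libraries(my_app PRIVATE AMReX::amrex)
+
+Which components are available depends on how the AMReX library was configured.
+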
For example, setting ``-DAMReX_LINEAR_SOLVERS=no`` at configure time prevents the compilation of AMReX linear solvers code. Your CMake project can check which component is included in the AMReX library via `find_package`: @@ -590,57 +638,57 @@ A list of AMReX component names and related configure options are shown in the t +------------------------------+-----------------+ | Option | Component | +==============================+=================+ - | DIM | 1D, 2D, 3D | + | AMReX_SPACEDIM | 1D, 2D, 3D | +------------------------------+-----------------+ - | ENABLE_DP | DP | + | AMReX_PRECISION | DOUBLE, SINGLE | +------------------------------+-----------------+ - | ENABLE_PIC | PIC | + | AMReX_FORTRAN | FORTRAN | +------------------------------+-----------------+ - | ENABLE_MPI | MPI | + | AMReX_PIC | PIC | +------------------------------+-----------------+ - | ENABLE_OMP | OMP | + | AMReX_MPI | MPI | +------------------------------+-----------------+ - | ENABLE_CUDA | CUDA | + | AMReX_OMP | OMP | +------------------------------+-----------------+ - | ENABLE_FORTRAN_INTERFACES | FINTERFACES | + | AMReX_CUDA | CUDA | +------------------------------+-----------------+ - | ENABLE_LINEAR_SOLVERS | LSOLVERS | + | AMReX_FORTRAN_INTERFACES | FINTERFACES | +------------------------------+-----------------+ - | ENABLE_AMRDATA | AMRDATA | + | AMReX_LINEAR_SOLVERS | LSOLVERS | +------------------------------+-----------------+ - | ENABLE_EB | EB | + | AMReX_AMRDATA | AMRDATA | +------------------------------+-----------------+ - | ENABLE_PARTICLES | PARTICLES | + | AMReX_EB | EB | +------------------------------+-----------------+ - | ENABLE_DP_PARTICLES | DPARTICLES | + | AMReX_PARTICLES | PARTICLES | +------------------------------+-----------------+ - | ENABLE_BASE_PROFILE | BASEP | + | AMReX_PARTICLES_PRECISION | PDOUBLE, PSINGLE| +------------------------------+-----------------+ - | ENABLE_TINY_PROFILE | TINYP | + | AMReX_BASE_PROFILE | BASEP | +------------------------------+-----------------+ - | ENABLE_TRACE_PROFILE | TRACEP | + | AMReX_TINY_PROFILE | TINYP | +------------------------------+-----------------+ - | ENABLE_COMM_PROFILE | COMMP | + | AMReX_TRACE_PROFILE | TRACEP | +------------------------------+-----------------+ - | ENABLE_MEM_PROFILE | MEMP | + | AMReX_COMM_PROFILE | COMMP | +------------------------------+-----------------+ - | ENABLE_PROFPARSER | PROFPARSER | + | AMReX_MEM_PROFILE | MEMP | +------------------------------+-----------------+ - | ENABLE_BACKTRACE | BACKTRACE | + | AMReX_PROFPARSER | PROFPARSER | +------------------------------+-----------------+ - | ENABLE_FPE | FPE | + | AMReX_FPE | FPE | +------------------------------+-----------------+ - | ENABLE_ASSERTIONS | ASSERTIONS | + | AMReX_ASSERTIONS | ASSERTIONS | +------------------------------+-----------------+ - | ENABLE_SUNDIALS | SUNDIALS | + | AMReX_SUNDIALS | SUNDIALS | +------------------------------+-----------------+ - | ENABLE_SENSEI_IN_SITU | SENSEI | + | AMReX_SENSEI | SENSEI | +------------------------------+-----------------+ - | ENABLE_CONDUIT | CONDUIT | + | AMReX_CONDUIT | CONDUIT | +------------------------------+-----------------+ - | ENABLE_ASCENT | ASCENT | + | AMReX_ASCENT | ASCENT | +------------------------------+-----------------+ - | ENABLE_HYPRE | HYPRE | + | AMReX_HYPRE | HYPRE | +------------------------------+-----------------+ .. 
raw:: latex @@ -681,17 +729,17 @@ More details on ``find_package`` can be found AMReX on Windows ================ -The AMReX team does development on Linux machines, from desktop workstations to supercomputers. Many people also use AMReX on Macs without issues. +The AMReX team does development on Linux machines, from laptops to supercomputers. Many people also use AMReX on Macs without issues. -We do not officially support AMReX on Windows. However, we believe there are no fundamental issues for making it work on Windows. -AMReX mostly uses standard C++11, and there are only a few places that are UNIX/Linux specific. These are: +We do not officially support AMReX on Windows, and many of us do not have access to any Windows +machines. However, we believe there are no fundamental issues preventing it from working on Windows. -(1) File system: We use some of the POSIX standard functions for operations like making a new directory, detecting if a file exists, etc. -C++17 now has a filesystem library that should work on any platform. AMReX does not require C++17, but we are happy to provide a C++17 support for the file system part. +(1) AMReX mostly uses standard C++11, but for Windows C++17 is required. This is because we use + C++17 to support file system operations when POSIX I/O is not available. -(2) Signal handling: We use POSIX handling when floating point exceptions, segmentation faults, etc. happen. -This capability allows us to print a backtrace of what leads to the error and is very useful for debugging but not required for using AMReX. -Some of the POSIX handling is platform-dependent, and Windows does seem to have this capability. If you need it, it should not be hard for you to make it work on Windows. +(2) We use POSIX signal handling when floating point exceptions, segmentation faults, etc. happen. +This capability is not supported on Windows. -(3) Memory profiling: This is an optional feature in AMReX that is not enabled by default. -It reads memory system information from the OS to give us a summary of our memory usage. +(3) Memory profiling is an optional feature in AMReX that is not enabled by default. It reads +memory system information from the OS to give us a summary of our memory usage. This is not +supported on Windows. diff --git a/Docs/sphinx_documentation/source/CVODE_top.rst b/Docs/sphinx_documentation/source/CVODE_top.rst deleted file mode 100644 index 2a30518c32b..00000000000 --- a/Docs/sphinx_documentation/source/CVODE_top.rst +++ /dev/null @@ -1,40 +0,0 @@ -.. _Chap:CVODE: -CVODE -===== -AMReX supports local ODE integration using the CVODE solver, [1]_ which is part -of the SUNDIALS framework. [2]_ CVODE contains solvers for stiff and non-stiff -ODEs, and as such is well suited for solving e.g., the complex chemistry -networks in combustion simulations, or the nuclear reaction networks in -astrophysical simulations. -Most of CVODE is written in C, but many functions also come with two distinct -Fortran interfaces. One interface is FCVODE, which is bundled with the stable -release of CVODE. Its usage is described in the CVODE documentation. [3]_ -However, the use of FCVODE is discouraged in AMReX due to its incompatibility -with being used inside OpenMP parallel regions (which is the primary use case -in AMReX applications). -The alternative, and recommended, Fortran interface to uses the -``iso_c_binding`` feature of the Fortran 2003 standard to implement a direct -interface to the C functions in CVODE. When compiling CVODE, one need not
When compiling CVODE, one need not -build the CVODE library with the FCVODE interface enabled at all. Rather, the -Fortran 2003 interface to CVODE is provided within AMReX itself. The -CVODE tutorials provided in AMReX use this new interface. - -.. toctree:: - :maxdepth: 1 - - CVODE - SUNDIALS3 - - -.. [1] - https://computation.llnl.gov/projects/sundials/cvode - -.. [2] - https://computation.llnl.gov/projects/sundials - -.. [3] - https://computation.llnl.gov/sites/default/files/public/cv_guide.pdf diff --git a/Docs/sphinx_documentation/source/EB.rst b/Docs/sphinx_documentation/source/EB.rst index 2407fbecffd..e6a759dae5e 100644 --- a/Docs/sphinx_documentation/source/EB.rst +++ b/Docs/sphinx_documentation/source/EB.rst @@ -549,531 +549,6 @@ testing cell types and getting neighbor information. For example end do - -.. _sec:EB:LevelSet: - -Level Sets -========== - -In order to speed up direct interactions with embedded boundaries, AMReX also -provides a way to construct level-sets representing the signed distance function -from the closest EB surface. In our implementation, the level-set data is stored -as a 1-component nodal :cpp:`MultiFab` (cf. :ref:`sec:basics:multifab`) where -each node stores its closest distance to the EB. The subroutine -:fortran:`amrex_eb_interp_levelset` (in ``/Scr/EB/AMREX_EB_levelset_F.F90``) -interpolates the level-set :math:`\phi(\mathbf{r})` to any position -:math:`\mathbf{r}` from the pre-computed level-set :cpp:`MultiFab`. Likewise the -subroutine :fortran:`amrex_eb_normal_levelset` interpolated the normal -:math:`\mathbf{\hat{n}}(\mathbf{r})` at any position from the derivative of the -level-set function :math:`\mathbf{\hat{n}}(\mathbf{r}) = \nabla -\phi(\mathrm{r})`. **Note** that since the normal is computed by taking the -derivative of the interpolation function, it is discontinuous at positions -corresponding to the nodal points of the level-set :cpp:`MultiFab` (i.e. -:math:`\mathbf{r} = (i, j, k) \cdot h`). - -At this point, AMReX does not provide a C++ interface for interpolating the -level-set at a point. This is because so far the level-set was only needed while performing calculations in Fortran. The interpolation subroutines contained in :fortran:`amrex_eb_levelset_module` are: - -.. highlight:: fortran - -:: - - pure subroutine amrex_eb_interp_levelset(pos, plo, n_refine, & - phi, phlo, phhi, & - dx, phi_interp ) - -and - -.. highlight:: fortran - -:: - - pure subroutine amrex_eb_normal_levelset(pos, plo, n_refine, & - phi, phlo, phhi, & - dx, normal ) - -which interpolate the level-set value :fortran:`phi_interp` and -:fortran:`normal`, respectively, at the 3-dimensional point :fortran:`pos`. The -nodal values of the level-set are given by the :fortran:`phi` array. -:fortran:`dx/n_refine` is the refined cell-size of the level-set array. For -example - -.. highlight:: fortran - -:: - - use iso_c_binding , only : c_int - use amrex_fort_module, only : c_real => amrex_real - use amrex_eb_levelset_module, only: amrex_eb_interp_levelset - - ! ** level-set data - ! philo, phihi - dimensions of phi array - ! dx - spatial discretization - ! n_refine - refinement of phi array (wrt to dx) - integer(c_int) :: philo(3), phihi(3) - real(c_real) :: phi( phlo(1):phhi(1), phlo(2):phhi(2), phlo(3):phhi(3) ) - real(c_real) :: dx(3) - integer(c_int) :: n_refine - - ! ** interpolated level-set - ! pos - coordinate where to interpolate - ! 
ls_value - interpolated level-set value (output) - real(c_real) :: pos(3), ls_value - - call amrex_eb_interp_levelset(pos, plo, n_refine, phi, phlo, phhi, dx, ls_value); - - -AMReX provides collection of functions and subroutines to fill single and -multi-level level-set data. For convenience, the :cpp:`amrex::LSFactory` helps -manage the level-set data for a single AMR level. And :cpp:`amrex::LSCore` -manages multi-level level-set data. These are described in further detail below. - - -A Note on Filling Level-Sets from :cpp:`EBFArrayBoxFactory` ------------------------------------------------------------ - -The data stored in a :cpp:`EBFArrayBoxFactory`, represents the embedded boundary -as a discrete collection of volume fractions, and area fractions over a grid. -Here this is further simplified by thinking of the EB as a collection of planar -facets. This means that for any given node in a grid, the nearest EB facet might -be in another grid. Hence if the :cpp:`EBFArrayBoxFactory` has :cpp:`n_pad` -ghost cells, then for any given grid, there could be EB facets that are -:cpp:`n_pad + 1` cells away, yet we would *not* "see". In other words, if the -:cpp:`EBFArrayBoxFactory` is defined on a grid with spacing :math:`h`, then, and -we do not have any EB facets in the current grid, then any node within that grid -is *at least* :math:`(n_\mathrm{pad}+1)h` away from the nearest EB surface. - -Hence, when filling a level-set, it will "max-out" at -:math:`\pm(n_\mathrm{pad}+1)h`. Hence it is recommended to think of this kind of -level-set function as the point being "at least" :math:`\phi(\mathbf{r})` from -the EB surface. - -.. _fig::local_levelset: - -.. figure:: ./EB/loc_ls_ex.png - :width: 50.0% - - : Example of a "local" level-set representing a cylinder. The level-set - function is a (linear) signed distance function near the EB-surface, and it - plateaus further away from it. - -Figure :numref:`fig::local_levelset` shows an example of such a local level-set -description for a cylinder. Only cells that are within -:math:`\pm(n_\mathrm{pad}+1)h` of the EB surface are filled with a level-set. -The rest is filled with lower (upper) bound. If the goal is capture interactions -between the EB surface and a point somewhere else, this approach usually -suffices as we only need to know if we are "far enough" from the EB in most -applications. - -Since finding the closest distance between a point and an arbitrary surface is -computationally expensive, we advice that :cpp:`n_pad` is chosen as the smallest -necessary number for the application. - - -.. _ss:ls:nolsf: - -Filling Level-Sets without :cpp:`LSFactory` -------------------------------------------- - -The static function :cpp:`amrex::LSFactory::fill_data` (defined in -``Src/EB/AMReX_EB_levelset.cpp``) fills a :cpp:`MultiFab` with the nodal level-set -values and another :cpp:`iMultiFab` with integer tags that are 1 whenever a node -is near the EB surface. It is then left up to the application to manage the -level-set :cpp:`MultiFab`. - -AMReX defines embedded surfaces using implicit functions (see above). Normally -these implicit functions are usually *not* signed distance functions (i.e. their -value at :math:`\mathbf{r}` is not the minimal distance to the EB surface). -However, in rare cases such as the :cpp:`EB2::PlaneIF`, it is. In this case, the -most straight-forward way to fill a level-set. If an signed-distance implicit -function is know, and stored as a :cpp:`MultiFab mf_impfunc`, then we can use - -.. 
highlight:: c++ - -:: - - static void fill_data (MultiFab & data, iMultiFab & valid, - const MultiFab & mf_impfunc, - int eb_pad, const Geometry & eb_geom); - -so then the function call - -.. highlight:: c++ - -:: - - // Fill implicit function - GShopLSFactory cylinder_lsgs(cylinder_ghsop, geom, ba, dm, 0); - std::unique_ptr cylinder_mf_impfunc = cylinder_lsgs.fill_impfunc(); - - - MultiFab ls_grid(ba, dm, 1, 0); - iMultiFab ls_valid(ba, dm, 1, 0); - amrex::LSFactory::fill_data(ls_grid, ls_valid, mf_impfunc, 2, geom_eb); - -fills a :cpp:`MultiFab ls_grid` with level-set data given the implicit function -stored in the :cpp:`MultiFab mf_impfunc`, and a threshold of -:cpp:`2*geom_eb.CellSize()`. The helper class :cpp:`GShopLSFactory` converts EB2 -implicit functions to :cpp:`MultiFabs` (defined in -``Src/EB/AMReX_EB_levelset.H``). - -The much more interesting application of :cpp:`amrex::LSFactory::fill_data` is -filling a level-set given a :cpp:`EBFArrayBoxFactory`: - -.. highlight:: c++ - -:: - - static void fill_data (MultiFab & data, iMultiFab & valid, - const EBFArrayBoxFactory & eb_factory, - const MultiFab & eb_impfunc, - const IntVect & ebt_size, int ls_ref, int eb_ref, - const Geometry & geom, const Geometry & geom_eb); - -which fills the :cpp:`MultiFab data` with level-set data from the -:cpp:`EBFArrayBoxFactory eb_factory`. Here the user must still supply the EB -implicit function using the :cpp:`MultiFab eb_impfunc`, as this is used to -determine the inside/outside when no EB facets can be found, or in special -edge-cases. The user also needs to specify the tile size (:cpp:`IntVect -ebt_size`), the level-set and EB refinement (i.e. the grid over which -:cpp:`data` is defined is refined by a factor of :cpp:`ls_ref/eb_ref` compared -to the :cpp:`eb_factory` 's grid), and the Geometries :cpp:`geom` and -:cpp:`geom_eb` corresponding to the grids of :cpp:`data` and :cpp:`eb_factory` -respectively. - -When filling :cpp:`data`, a tile-size of :cpp:`ebt_size` is used. Only EB facets -within a tile (plus the :cpp:`eb_factory` ghost cells) are considered. Hence, -chosing an appropriate :cpp:`ebt_size` can significantly increase performance. - -For example, the following fills a level-set with a cylinder EB (like that shown -in Fig. :numref:`fig::local_levelset`). - -.. highlight:: c++ - -:: - - // Define nGrow of level-set and EB - int ls_pad = 1; - int eb_pad = 2; - - // Define EB - EB2::CylinderIF cylinder(radius, centre, true); - EB2::GeometryShop cylinder_gshop(cylinder); - - // Build EB - EB2::Build(cylinder_gshop, geom, max_level, max_level); - const EB2::IndexSpace & cylinder_ebis = EB2::IndexSpace::top(); - const EB2::Level & cylinder_lev = cylinder_ebis.getLevel(geom); - - // Build EB factory - EBFArrayBoxFactory eb_factory(cylinder_lev, geom, ba, dm, {eb_pad, eb_pad, eb_pad}); - - // Fill implicit function - GShopLSFactory cylinder_lsgs(cylinder_ghsop, geom, ba, dm, ls_pad); - std::unique_ptr cylinder_mf_impfunc = cylinder_lsgs.fill_impfunc(); - - // Fill level-set - MultiFab ls_grid(ba, dm, 1, ls_pad); - iMultiFab ls_valid(ba, dm, 1, ls_pad); - LSFactory::fill_data(ls_grid, ls_valid, eb_factory, * cylinder_mf_impfunc, - ebt_size, 1, 1, geom, geom); - -Note that in theory the :cpp:`EBFArrayBoxFactory eb_factory` could be defined on -a different resolution as the the :cpp:`BoxArray ba`. In this case, the -appropriate refinements and geometries must be specified. 
Also note that the -thresholding behaviour (due to :cpp:`eb_pad`) is specified via the -:cpp:`EBFArrayBoxFactory` constructor. The implicit function MultiFab needs to -have the same grids as `data`. - -Since this relies on the interplay of many different parameters, a number of -utility functions and helper classes have been created. These are discussed in -the subsequent sections. - -The common operations of intersections and unions (similar to EB implicit -functions, discussed in :ref:`sec:EB:ebinit:IF`) can also be applied to -level-sets. Without the use of a :cpp:`LSFactory`, the functions: - -.. highlight:: c++ - -:: - - static void intersect_data (MultiFab & data, iMultiFab & valid, - const MultiFab & data_in, const iMultiFab & valid_in, - const Geometry & geom_ls); - -and - -.. highlight:: c++ - -:: - - static void union_data (MultiFab & data, iMultiFab & valid, - const MultiFab & data_in, const iMultiFab & valid_in, - const Geometry & geom_ls); - -These apply the intersection (element-wise minimum) and union (maximum) between -the :cpp:`MultiFab data`, and :cpp:`data_in`. The result overwrites the contents -of :cpp:`data`. The tags stored in the :cpp:`iMultiFab valid_in` determine where -the intersection takes place (i.e. only cells where both :cpp:`valid_in == 1` -are intersected, others are ignored). - - -Using :cpp:`LSFactory` ----------------------- - -In the previous section, we've seen that the level-set and EB grids can exist on -different levels of refinement. The practical reason behind this is that -sometimes we want to capture interactions that are very sensitive close to EBs, -but this can sometimes be difficult to keep track of. Hence the :cpp:`LSFactory` -can be helpful in taking care of all of these parameters. - -The basic principle of the :cpp:`LSFactory` (defined in -``Src/EB/AMReX_EB_levelset.H``) is that it is created relative to some reference -:cpp:`BoxArray ba`, :cpp:`Geometry geom`, and :cpp:`DistributionMapping dm`. The -user then specifies refinement factors :cpp:`ls_ref` of the level-set data and -:cpp:`eb_ref` of the EB grid. Calling the constructor: - -.. highlight:: c++ - -:: - - LSFactory(int lev, int ls_ref, int eb_ref, int ls_pad, int eb_pad, - const BoxArray & ba, const Geometry & geom, const DistributionMapping & dm, - int eb_tile_size = 32); - -Then creates all appropriate grids and geometries. Note that we can also specify -the tile size used internally in the :cpp:`LSFactory::fill_data` function. - -When a :cpp:`LSFacotry` is first created, its level-set values are set to -:fortran:`huge(amrex_real)`. I. e. there are no surfaces, and so the level-set -value is effectively infinite. It can then be filled just like in the previous -section: - -.. 
highlight:: c++ - -:: - - // Define refinement of level-set and EB - int ls_ref = 4; - int eb_ref = 1; - - // Define nGrow of level-set and EB - int ls_pad = 1; - int eb_pad = 2; - - // Define EB - EB2::CylinderIF cylinder(radius, centre, true); - EB2::GeometryShop cylinder_gshop(cylinder); - - // Build level-set factory - LSFactory level_set(0, ls_ref, eb_ref, ls_pad, eb_pad, ba, geom, dm); - - // Build EB - const Geometry & eb_geom = level_set.get_eb_geom() - EB2::Build(cylinder_gshop, eb_geom, max_level, max_level); - - const EB2::IndexSpace & cylinder_ebis = EB2::IndexSpace::top(); - const EB2::Level & cylinder_lev = cylinder_ebis.getLevel(eb_geom); - - // Build EB factory - EBFArrayBoxFactory eb_factory(cylinder_lev, eb_geom, level_set.get_eb_ba(), dm, - {level_set.get_eb_pad(), level_set.get_eb_pad(), - level_set.get_eb_pad()}); - - // Fill level-set (factory) - GShopLSFactory cylinder_lsgs(cylinder_ghsop, level_set); - std::unique_ptr cylinder_mf_impfunc = cylinder_lsgs.fill_impfunc(); - level_set.Fill(eb_factory, * cylinder_mf_impfunc); - -where the level-set data can now be accessed using: - -.. highlight:: c++ - -:: - - const MultiFab * level_set_data = level_set.get_data(); - -or alternatively a copy of the data can be generated using: - -.. highlight:: c++ - -:: - - std::unique_ptr level_set_data = level_set.copy_data(); - -Both of the data above are on grids that have been refined by :cpp:`ls_ref` -(with respect to the :cpp:`BoxArray ba`). In order to get a copy of the -level-set data at the coarseness of the original grids, use: - -.. highlight:: c++ - -:: - - std::unique_ptr level_set_data_crse = level_set.coarsen_data(); - -Note however, that the level-set data is nodal data. Therefore, even though the -:cpp:`MultiFab level_set_data_crse` is defined on a grid with the same -resolution as the :cpp:`BoxArray ba`, it is defined on the nodal version of that -grid. - -The :cpp:`LSFactory` is also there to make operations on the level-set easier. -Intersection and Union operations with EB factories and implicit functions are -available in the :cpp:`LSFactory` class. As well as functions to regrid -(updating the underlying :cpp:`BoxArray` and :cpp:`DistributionMapping`), -copying, and inverting the level-set function. - - -Filling Multi-Level Level-Sets without :cpp:`LSCore` ----------------------------------------------------- - -AMReX also provides code to fill the level-set function on different levels of -refinement. The static function :cpp:`amrex::LSCoreBase::FillLevelSet`, -:cpp:`amrex::LSCoreBase::MakeNewLevelFromCoarse`, and -:cpp:`amrex::LSCoreBase::FillVolfracTags` (or -:cpp:`amrex::LSCoreBase::FillLevelSetTags` for level-set tagging instead of -volume-fraction tagging) fill a finer level from a coarse one. Just like the -section on :ref:`ss:ls:nolsf`, the philosophy here is to enable to user to fill -a :cpp:`MultiFab` with level-set values, and manage this data structure -themselves. Later we will discuss the :cpp:`LSCore` class, which automatically -constructs multi-level level-sets. - -One common problem with level-set function is that they are expensive to -compute. Therefore, a strategy would be to compromise by computing the level-set -function accurately near embedded boundaries (where precision is important), and -at a lower resolution for from walls. The function - -.. 
highlight:: c++ - -:: - - static void FillVolfracTags( int lev, TagBoxArray & tags, - const Vector & grids, - const Vector & dmap, - const EB2::Level & eb_lev, const Vector & geom ); - -fills a :cpp:`TagBoxArray` with tags wherever the volume fraction is between 0 -and 1. This way any cut-cells a buffered of :cpp:`amr.n_error_buf` many -neighbors is tagged for refinement. If we need finer control over the tagging, -the function - -.. highlight:: c++ - -:: - - static void FillLevelSetTags( int lev, TagBoxArray & tags, const Vector & phierr, - const MultiFab & levelset_data, const Vector & geom ); - -takes a list of threshold level-set values (:cpp:`Vector & phierr`) and -tags cells for refinement if the coarse estimate of the levelset -(:cpp:`levelset_data`) from level :cpp:`lev` is less than :cpp:`phierr[lev]`. - -The following code would then fill a multi-level hierarchy of level-sets -contained in :cpp:`Vector level_sets`. - -.. highlight:: c++ - -:: - - //___________________________________________________________________________ - // Start with level zero - - EBFArrayBoxFactory eb_factory(* eb_levels[0], geom[0], grids[0], dmap[0], - {eb_pad, eb_pad, leb_pad}, EBSupport::full); - - // NOTE: reference BoxArray is not nodal - BoxArray nd_ba = amrex::convert(grids[0], IntVect::TheNodeVector()); - - level_sets[0].define(nd_ba, dmap[0], 1, pad); - iMultiFab valid(nd_ba, dmap[0], 1, pad); - - // NOTE: implicit function data might not be on the right grids - MultiFab impfunc = MFUtil::regrid(nd_ba, dmap[0], implicit_functions[0], true); - - LSFactory::fill_data(level_sets[0], valid, ebfactory, impfunc, - 32, 1, 1, geom[0], geom[0]); - - - //___________________________________________________________________________ - // Fill finer levels, using coarser level to estimate level-set - - for (int lev = 1; lev < nlev; lev++) { - // NOTE: reference BoxArray is not nodal - BoxArray ba = amrex::convert(grids[lev], IntVect::TheNodeVector()); - level_sets[lev].reset(new MultiFab); - iMultiFab valid(ba, dmap[lev], 1, pad); - - // Fills level_sets[lev] with coarse data - LSCoreBase::MakeNewLevelFromCoarse( level_sets[lev], level_sets[lev-1], - ba, dmap[lev], geom[lev], geom[lev-1], - bcs_ls, refRatio(lev-1)); - - EBFArrayBoxFactory eb_factory(* eb_levels[lev], geom[lev], grids[lev], dmap[lev], - {eb_pad, eb_pad, eb_pad}, EBSupport::full); - - // NOTE: implicit function data might not be on the right grids - MultiFab impfunc = MFUtil::regrid(ba, dmap[lev], implicit_functions[lev]); - - IntVect ebt_size{AMREX_D_DECL(32, 32, 32)}; // Fudge factors... - LSCoreBase::FillLevelSet(level_sets[lev], level_sets[lev], eb_factory, impfunc, - ebt_size, eb_pad, geom[lev]); - } - -Here the :cpp:`Vector eb_levels` has been filled while -initializing the embedded boundaries. At the same time, the implicit functions -need to be saved to :cpp:`Vector implicit_functions`. The user also -needs to specify the level-set boundary conditions in :cpp:`Vector -bcs_ls`. Note that the function :cpp:`LSCoreBase::FillLevelSet` uses the coarse -level-set as an upper bound to the tile size used for testing EB facets. - - - -Using :cpp:`LSCore` -------------------- - -The process described in the previous section is automated in the :cpp:`LSCore` -class. It is derived from :cpp:`LSCoreBase`, which in turn is derived from -:cpp:`AmrCore` (cf. :ref:`Chap:AmrCore`). :cpp:`LSCore` is a template class -depending on the embedded boundary implicit function. 
This way, it can build new
-:cpp:`EB2::Level` objects for every new level that is needed.
-
-Since :cpp:`LSCore` is a template class, it might lead to problems in
-applications where the template parameter can depend of runtime parameters. This
-is the reason why it derives from the base class :cpp:`LSCoreBase`.
-:cpp:`LSCore` overwrites the virtual function :cpp:`MakeNewLevelFromScratch` in
-:cpp:`LSCoreBase`. The application can then employ the following polymorphism to
-construct the level-set;
-
-.. highlight:: c++
-
-::
-
-    LSCoreBase * ls_core;
-
-    // sets ls_core pointer
-    make_my_eb(ls_core);
-
-    ls_core->InitData();
-
-where the function :cpp:`make_my_eb` defines the actual EB geometry:
-
-.. highlight:: c++
-
-::
-
-    void make_my_eb(LSCoreBase *& ls_core) {
-
-        // MyIF is an EB2 Implicit Fuction
-        GeometryShop gshop;
-
-        // Build an EB geometry shop here
-
-        ls_core = new LSCore(gshop);
-    }
-
-Here the :cpp:`make_my_eb` is only defines the EB geometry. The function call
-:cpp:`ls_core->InitData()` constructs level hierarchy and fills it with
-level-set values.
-
 Linear Solvers
 ==============
diff --git a/Docs/sphinx_documentation/source/EB/loc_ls_ex.png b/Docs/sphinx_documentation/source/EB/loc_ls_ex.png
deleted file mode 100644
index 48f6aa654d3..00000000000
Binary files a/Docs/sphinx_documentation/source/EB/loc_ls_ex.png and /dev/null differ
diff --git a/Docs/sphinx_documentation/source/External_Frameworks_Chapter.rst b/Docs/sphinx_documentation/source/External_Frameworks_Chapter.rst
index 97bcb96c9c7..3d15c083036 100644
--- a/Docs/sphinx_documentation/source/External_Frameworks_Chapter.rst
+++ b/Docs/sphinx_documentation/source/External_Frameworks_Chapter.rst
@@ -6,5 +6,5 @@ External Frameworks
 .. toctree::
    :maxdepth: 1
 
-   CVODE_top
+   SUNDIALS_top
    SWFFT
diff --git a/Docs/sphinx_documentation/source/External_Profiling_Tools.rst b/Docs/sphinx_documentation/source/External_Profiling_Tools.rst
index 6a45a3bd938..71222d7588e 100644
--- a/Docs/sphinx_documentation/source/External_Profiling_Tools.rst
+++ b/Docs/sphinx_documentation/source/External_Profiling_Tools.rst
@@ -279,3 +279,202 @@ generated figures. Some examples are shown here.
 
 .. [5]
    https://www.nersc.gov/users/software/performance-and-debugging-tools/ipm/
+
+Nsight Systems
+==============
+
+The Nsight Systems tool provides a high-level overview of your code, displaying the kernel
+launches, API calls, NVTX regions and more in a timeline for a clear, visual picture of the
+overall runtime patterns. It analyzes CPU codes or CUDA-based GPU codes and is available
+on Summit and Cori in a system module.
+
+Nsight Systems provides a variety of profiling options. This documentation will cover the
+most commonly used options for AMReX users, collecting useful flags and analysis
+patterns. For the complete details of using Nsight Systems, refer to the `Nsight Systems
+official documentation <https://docs.nvidia.com/nsight-systems/>`_.
+
+Profile Analysis
+----------------
+
+The most common use case of Nsight Systems for AMReX users is the creation of a qdrep file
+that is viewed in the Nsight Systems GUI, typically on a local workstation or machine.
+
+To generate a qdrep file, run nsys with the ``-o`` option:
+
+.. highlight:: console
+
+::
+
+    nsys profile -o <report-name> ${EXE} ${INPUTS}
+
+AMReX's lambda-based launch system often makes these timelines difficult to parse, as the kernel
+names are mangled and difficult to decipher. AMReX's Tiny Profiler includes NVTX region markers,
+which can be used to mark the respective section of the Nsight Systems timeline. To include AMReX's
+built-in Tiny Profiler NVTX regions in Nsight Systems outputs, compile AMReX with ``TINY_PROFILE=TRUE``.
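+
+For example, a function timed with TinyProfiler's ``BL_PROFILE`` macro also shows up as
+an NVTX range of the same name when built with ``TINY_PROFILE=TRUE``. A minimal sketch
+(the function and region name here are illustrative):
+
+.. highlight:: c++
+
+::
+
+    #include <AMReX_BLProfiler.H>
+
+    void do_hydro ()
+    {
+        // With TINY_PROFILE=TRUE, this timer also emits an NVTX range named
+        // "do_hydro" that appears on the Nsight Systems timeline and can be
+        // targeted with, e.g., -p "do_hydro@*".
+        BL_PROFILE("do_hydro");
+
+        // ... work to be profiled ...
+    }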
+
+Nsight Systems timelines only profile a single, contiguous block of time. There are a variety of
+methods to specify the specific region you would like to analyze. The most common options that AMReX users
+may find helpful are:
+
+1. **Specify an NVTX region as the starting point of the analysis.**
+
+This is done using ``-c nvtx -p "region_name@*" -e NSYS_NVTX_PROFILER_REGISTER_ONLY=0``, where ``region_name``
+is the identification string of the NVTX region. The additional environment variable,
+``-e ...`` is needed because AMReX's NVTX region names currently do not use a registered string.
+TinyProfiler's built-in NVTX regions use the same identification string as the timer itself. For
+example, to start an analysis at the ``do_hydro`` NVTX region, run:
+
+.. highlight:: console
+
+::
+
+    nsys profile -o <report-name> -c nvtx -p "do_hydro@*" -e NSYS_NVTX_PROFILER_REGISTER_ONLY=0 ${EXE} ${INPUTS}
+
+This will profile from the first instance of the specified NVTX region until the end of the
+application. In AMReX applications, this can be helpful to skip initialization and analyze the
+remainder of the code. To only analyze the specified NVTX region, add the flag ``-x true``, which
+will end the analysis at the end of the region:
+
+.. highlight:: console
+
+::
+
+    nsys profile -o <report-name> -c nvtx -p "do_hydro@*" -x true -e NSYS_NVTX_PROFILER_REGISTER_ONLY=0 ${EXE} ${INPUTS}
+
+Again, it's important to remember that Nsight Systems only analyzes a single contiguous block of
+time. So, this will only give you a profile for the first instance of the named region. Plan your
+Nsight Systems analyses accordingly.
+
+2. **Specify a region with CUDA profiler API calls.**
+
+This requires manually altering your source code, but can provide better specificity in what you analyze.
+Directly insert ``cudaProfilerStart()`` and ``cudaProfilerStop()`` (declared in ``cuda_profiler_api.h``)
+around the region of code you want to analyze:
+
+.. highlight:: c++
+
+::
+
+    cudaProfilerStart();
+
+    // CODE TO PROFILE
+
+    cudaProfilerStop();
+
+
+Then, run with ``-c cudaProfilerApi``:
+
+.. highlight:: console
+
+::
+
+    nsys profile -o <report-name> -c cudaProfilerApi ${EXE} ${INPUTS}
+
+As with NVTX regions, Nsight Systems will only profile from the first call to ``cudaProfilerStart()``
+to the first call to ``cudaProfilerStop()``, so be sure to add these markers appropriately.
+
+
+Nsight Systems GUI Tips
+-----------------------
+
+* When analyzing an AMReX application in the Nsight Systems GUI using NVTX regions or ``TINY_PROFILE=TRUE``,
+  AMReX users may find it useful to turn on the feature "Rename CUDA Kernels by NVTX". This will change the
+  CUDA kernel names to match the inner-most NVTX region in which they were launched instead of the typical
+  mangled compiler name. This will make identifying AMReX CUDA kernels in Nsight Systems reports considerably easier.
+
+  This feature can be found in the GUI's drop-down menu, under:
+
+.. highlight:: console
+
+::
+
+    Tools -> Options -> Environment -> Rename CUDA Kernels by NVTX.
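+
+* Reports are typically generated on the compute system and inspected on a local
+  workstation. Assuming a local Nsight Systems installation, a report can be opened
+  either through ``File -> Open`` in the GUI or from the command line (the report
+  name here is illustrative):
+
+.. highlight:: console
+
+::
+
+    nsight-sys report1.qdrep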
+
+
+Nsight Compute
+==============
+
+The Nsight Compute tool provides a detailed, fine-grained analysis of your CUDA kernels,
+giving details about the kernel launch, occupancy, and limitations while suggesting possible
+improvements to maximize the use of the GPU. It analyzes CUDA-based GPU codes and is available
+on Summit and Cori in system modules.
+
+Nsight Compute provides a variety of profiling options. This documentation will focus on the
+most commonly used options for AMReX users, primarily to keep track of useful flags and analysis
+patterns. For the complete details of using Nsight Compute, refer to the `Nsight Compute
+official documentation <https://docs.nvidia.com/nsight-compute/>`_.
+
+
+Kernel Analysis
+---------------
+
+The standard way to run Nsight Compute on an AMReX application is to specify an output file
+that will be transferred to a local workstation or machine for viewing in the Nsight Compute GUI.
+Nsight Compute can be told to return a report file using the ``-o`` flag. In addition, when
+running with Nsight Compute on an AMReX application, it is important to turn off the floating
+point exception trap, as it causes a runtime error. So, an entire AMReX application can be
+analyzed with Nsight Compute by running:
+
+.. highlight:: console
+
+::
+
+    ncu -o <report-name> ${EXE} ${INPUTS} amrex.fpe_trap_invalid=0
+
+However, this implementation should almost never be used by AMReX applications, as the analysis of
+every kernel would be extremely lengthy and unnecessary. To analyze a desired subset of CUDA
+kernels, AMReX users can use the Tiny Profiler's built-in NVTX regions to narrow the scope of
+the analysis. Nsight Compute allows users to specify which NVTX regions to include and exclude
+through the ``--nvtx``, ``--nvtx-include`` and ``--nvtx-exclude`` flags. For example:
+
+.. highlight:: console
+
+::
+
+    ncu --nvtx --nvtx-include "Hydro()" --nvtx-exclude "StencilA(),StencilC()" -o kernels ${EXE} ${INPUTS} amrex.fpe_trap_invalid=0
+
+will return a file named ``kernels`` which contains an analysis of the CUDA kernels launched inside
+the ``Hydro()`` region, ignoring any kernels launched inside ``StencilA()`` and ``StencilC()``.
+When using the NVTX regions built into AMReX's TinyProfiler, be aware that the application must be built
+with ``TINY_PROFILE=TRUE`` and the NVTX region names are identical to the TinyProfiler timer names.
+
+Another helpful flag for selecting a reasonable subset of kernels for analysis is the ``-c`` option. This
+flag specifies the total number of kernels to be analyzed. For example:
+
+.. highlight:: console
+
+::
+
+    ncu --nvtx --nvtx-include "GravitySolve()" -c 10 -o kernels ${EXE} ${INPUTS} amrex.fpe_trap_invalid=0
+
+will only analyze the first ten kernels inside of the ``GravitySolve()`` NVTX region.
+
+For further details on how to choose a subset of CUDA kernels to analyze, or to run a more detailed
+analysis, including CUDA hardware counters, refer to the Nsight Compute official documentation on
+`NVTX Filtering <https://docs.nvidia.com/nsight-compute/NsightComputeCli/index.html>`_.
+
+
+Roofline
+--------
+
+As of version 2020.1.0, Nsight Compute has added the capability to perform roofline analyses on CUDA
+kernels to describe how well a given kernel is running on a given NVIDIA architecture. For details
+on the roofline capabilities in Nsight Compute, refer to the `NVIDIA Kernel Profiling Guide
+<https://docs.nvidia.com/nsight-compute/ProfilingGuide/index.html>`_.
+
+To run a roofline analysis on an AMReX application, run ``ncu`` with the flag
+``--section SpeedOfLight_RooflineChart``. Again, using appropriate NVTX flags to limit the scope of the
+analysis will be critical to achieve results within a reasonable time. For example:
+
+.. highlight:: console
+
+::
+
+    ncu --section SpeedOfLight_RooflineChart --nvtx --nvtx-include "MLMG()" -c 10 -o roofline ${EXE} ${INPUTS} amrex.fpe_trap_invalid=0
+
+will perform a roofline analysis of the first ten kernels inside of the region ``MLMG()``, and report
+their relative performance in the file ``roofline``, which can be read by the Nsight Compute GUI.
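+
+As with Nsight Systems, the report is usually copied to a local workstation for
+inspection. Assuming a local Nsight Compute installation, it can be opened with the
+GUI launcher (the file name is illustrative, and the on-disk report extension may
+vary between Nsight Compute versions):
+
+.. highlight:: console
+
+::
+
+    ncu-ui roofline.ncu-rep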
+
+For further information on the roofline model, refer to the scientific literature, `Wikipedia
+overview <https://en.wikipedia.org/wiki/Roofline_model>`_, NERSC
+`documentation `_ and
+`tutorials `_.
diff --git a/Docs/sphinx_documentation/source/External_Profiling_Tools_Chapter.rst b/Docs/sphinx_documentation/source/External_Profiling_Tools_Chapter.rst
index 3ec6c6c3666..dc62454e8f8 100644
--- a/Docs/sphinx_documentation/source/External_Profiling_Tools_Chapter.rst
+++ b/Docs/sphinx_documentation/source/External_Profiling_Tools_Chapter.rst
@@ -3,6 +3,10 @@
 External Profiling Tools
 ===========================
 
+AMReX is compatible with most commonly used profiling tools. This chapter provides
+selected documentation on using a few of these tools with AMReX. For additional
+details on running these tools, please refer to each tool's official documentation.
+
 .. toctree::
    :maxdepth: 1
 
diff --git a/Docs/sphinx_documentation/source/Fortran.rst b/Docs/sphinx_documentation/source/Fortran.rst
index 46286073e00..9631374e53b 100644
--- a/Docs/sphinx_documentation/source/Fortran.rst
+++ b/Docs/sphinx_documentation/source/Fortran.rst
@@ -276,7 +276,7 @@ example,
     ! mf1 is still the owner of the data.
     call amrex_multifab_destroy(mf1)
     ! mf2 no longer contains a valid pointer because mf1 has been destroyed.
-    call amrex_multifab_destroyed(mf2)  ! But we still need to destroy it.
+    call amrex_multifab_destroy(mf2)  ! But we still need to destroy it.
 
 If we need to transfer the ownership, :fortran:`amrex_multifab`,
 :fortran:`amrex_boxarray` and :fortran:`amrex_distromap` provide type-bound
@@ -290,7 +290,7 @@ If we need to transfer the ownership, :fortran:`amrex_multifab`,
     call amrex_multifab_build(mf1, ...)
     call mf2%move(mf1)  ! mf2 is now the data owner and mf1 is not.
     call amrex_multifab_destroy(mf1)
-    call amrex_multifab_destroyed(mf2)
+    call amrex_multifab_destroy(mf2)
 
 :fortran:`amrex_multifab` also has a type-bound :fortran:`swap` procedure for
 exchanging the data.
diff --git a/Docs/sphinx_documentation/source/GPU.rst b/Docs/sphinx_documentation/source/GPU.rst
index 9e507e42fdc..c26fade1e2b 100644
--- a/Docs/sphinx_documentation/source/GPU.rst
+++ b/Docs/sphinx_documentation/source/GPU.rst
@@ -182,44 +182,201 @@ can run it and that will generate results like:
 Building with CMake
 -------------------
 
-To build AMReX with GPU support in CMake, add ``-DENABLE_CUDA=YES`` to the
-``cmake`` invocation. By default, CMake will try to determine which GPU
-architecture is supported by the system. If more than one is found, CMake
-will build for all of them. This will generally results in a larger library and longer build times.
-If autodetection fails, a set of "common" architectures is assumed.
-You can specify the target architecture to build for via the configuration option
-``-DCUDA_ARCH=``, where ```` can be either
-the name of the NVIDIA GPU, i.e. ``Turing``, ``Volta``, ``Pascal``, ``...`` , or its
-version number, i.e. ``10.0``, ``9.0``, ``8.0``, ``...`` .
+
+Enabling CUDA support
+^^^^^^^^^^^^^^^^^^^^^
+
+To build AMReX with CUDA support in CMake, add ``-DAMReX_GPU_BACKEND=CUDA`` to the
+``cmake`` invocation. For a full list of CUDA-specific configuration options,
+check the :ref:`table <tab:cmakecudavar>` below.
+
+.. raw:: latex
+
+   \begin{center}
+
+.. _tab:cmakecudavar:
+.. table:: AMReX CUDA-specific build options
+
+   +------------------------------+-------------------------------------------------+-------------+-----------------+
+   | Variable Name                | Description                                     | Default     | Possible values |
+   +==============================+=================================================+=============+=================+
+   | AMReX_CUDA_ARCH              | CUDA target architecture                        | Auto        | User-defined    |
+   +------------------------------+-------------------------------------------------+-------------+-----------------+
+   | AMReX_CUDA_FASTMATH          | Enable CUDA fastmath library                    | YES         | YES, NO         |
+   +------------------------------+-------------------------------------------------+-------------+-----------------+
+   | AMReX_CUDA_BACKTRACE         | Host function symbol names (e.g. cuda-memcheck) | Auto        | YES, NO         |
+   +------------------------------+-------------------------------------------------+-------------+-----------------+
+   | AMReX_CUDA_COMPILATION_TIMER | CSV table with time for each compilation phase  | NO          | YES, NO         |
+   +------------------------------+-------------------------------------------------+-------------+-----------------+
+   | AMReX_CUDA_DEBUG             | Device debug information (optimizations: off)   | NO          | YES, NO         |
+   +------------------------------+-------------------------------------------------+-------------+-----------------+
+   | AMReX_CUDA_ERROR_CAPTURE_THIS| Error if a CUDA lambda captures a class' this   | NO          | YES, NO         |
+   +------------------------------+-------------------------------------------------+-------------+-----------------+
+   | AMReX_CUDA_KEEP_FILES        | Keep intermediate files (folder: nvcc_tmp)      | NO          | YES, NO         |
+   +------------------------------+-------------------------------------------------+-------------+-----------------+
+   | AMReX_CUDA_LTO               | Enable CUDA link-time-optimization              | NO          | YES, NO         |
+   +------------------------------+-------------------------------------------------+-------------+-----------------+
+   | AMReX_CUDA_MAX_THREADS       | Max number of CUDA threads per block            | 256         | User-defined    |
+   +------------------------------+-------------------------------------------------+-------------+-----------------+
+   | AMReX_CUDA_MAXREGCOUNT       | Limits the number of CUDA registers available   | 255         | User-defined    |
+   +------------------------------+-------------------------------------------------+-------------+-----------------+
+   | AMReX_CUDA_PTX_VERBOSE       | Verbose code generation statistics in ptxas     | NO          | YES, NO         |
+   +------------------------------+-------------------------------------------------+-------------+-----------------+
+   | AMReX_CUDA_SHOW_CODELINES    | Source information in PTX (optimizations: on)   | Auto        | YES, NO         |
+   +------------------------------+-------------------------------------------------+-------------+-----------------+
+   | AMReX_CUDA_SHOW_LINENUMBERS  | Line-number information (optimizations: on)     | Auto        | YES, NO         |
+   +------------------------------+-------------------------------------------------+-------------+-----------------+
+   | AMReX_CUDA_WARN_CAPTURE_THIS | Warn if a CUDA lambda captures a class' this    | YES         | YES, NO         |
+   +------------------------------+-------------------------------------------------+-------------+-----------------+
+.. raw:: latex
+
+   \end{center}
+
+
+The target architecture to build for can be specified via the configuration option
+``-DAMReX_CUDA_ARCH=<target-architecture>``, where ``<target-architecture>`` can be either
+the name of the NVIDIA GPU generation, i.e. ``Turing``, ``Volta``, ``Ampere``, ``...`` , or its
+`compute capability <https://developer.nvidia.com/cuda-gpus>`_, i.e.
+``8.0``, ``7.5``, ``7.0``, ``...`` .
 For example, on Cori GPUs you can specify the architecture as follows:
 
 .. highlight:: console
 
 ::
 
-    cmake [options] -DENABLE_CUDA=yes -DCUDA_ARCH=Volta /path/to/amrex/source
+    cmake [options] -DAMReX_GPU_BACKEND=CUDA -DAMReX_CUDA_ARCH=Volta /path/to/amrex/source
 
-Note that AMReX only supports GPU architectures with version number ``6.0`` or higher.
+If no architecture is specified, CMake will default to the architecture defined in the
+*environment variable* ``AMREX_CUDA_ARCH`` (note: all caps).
+If the latter is not defined, CMake will try to determine which GPU
+architecture is supported by the system. If more than one is found, CMake will build for all of them.
+This will generally result in a larger library and longer build times.
+If autodetection fails, a set of "common" architectures is assumed.
+**Note that AMReX supports NVIDIA GPU architectures with compute capability 6.0 or higher and
+CUDA Toolkit version 9.0 or higher**.
 
-In order to import CUDA-enabled AMReX into your CMake project, you need to include
+In order to import the CUDA-enabled AMReX library into your CMake project, you need to include
 the following code into the appropriate CMakeLists.txt file:
 
 .. highlight:: console
-
+
 ::
 
     # Find CUDA-enabled AMReX installation
     find_package(AMReX REQUIRED CUDA)
-
-    # Add custom CUDA flags
-    set(CMAKE_CUDA_FLAGS "${CMAKE_CUDA_FLAGS} ")
+
+If instead of using an external installation of AMReX you prefer to include AMReX as a subproject
+in your CMake setup, we strongly encourage you to use the ``AMReX_SetupCUDA`` module as shown below:
+
+.. highlight:: console
+
+::
+
+    # Enable CUDA in your CMake project
+    enable_language(CUDA)
+
+    # Include the AMReX-provided CUDA setup module
+    include(AMReX_SetupCUDA)
+
+    # Include AMReX source directory ONLY AFTER the two steps above
+    add_subdirectory(/path/to/amrex/source/dir)
+
 
-The snippet of code above will find a CUDA-enabled installation of AMReX and setup
-the CUDA support in the host project CMake via the AMReX-provided macro ``setup_cuda()``.
-The host project should **not call directly** ``enable_language(CUDA)``.
+To ensure consistency between CUDA-enabled AMReX and any CMake target that links against it,
+we provide the helper function ``setup_target_for_cuda_compilation()``:
+
+
+.. highlight:: console
+
+::
+
+    # Set all sources for my_target
+    target_sources(my_target PRIVATE source1 source2 source3 ...)
+
+    # Setup my_target to be compiled with CUDA and be linked against CUDA-enabled AMReX
+    # MUST be done AFTER all sources have been assigned to my_target
+    setup_target_for_cuda_compilation(my_target)
+
+    # Link against amrex
+    target_link_libraries(my_target AMReX::amrex)
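+
+Putting the pieces above together, a minimal ``CMakeLists.txt`` for a host project
+linking against an installed, CUDA-enabled AMReX might look as follows (a sketch;
+the project name, target name, and source file are placeholders):
+
+.. highlight:: console
+
+::
+
+    cmake_minimum_required(VERSION 3.14)
+    project(my_app CXX CUDA)
+
+    # Find a CUDA-enabled AMReX installation
+    find_package(AMReX REQUIRED CUDA)
+
+    add_executable(my_app)
+    target_sources(my_app PRIVATE main.cpp)
+
+    # Must come AFTER all sources have been assigned to the target
+    setup_target_for_cuda_compilation(my_app)
+
+    target_link_libraries(my_app AMReX::amrex)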
+
+
+Enabling HIP support (experimental)
+^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
+
+To build AMReX with HIP support in CMake, add
+``-DAMReX_GPU_BACKEND=HIP -DAMReX_AMD_ARCH=<amd-gpu-architecture> -DCMAKE_CXX_COMPILER=<hip-compiler>``
+to the ``cmake`` invocation.
+
+In AMReX CMake, the HIP compiler is treated as a special C++ compiler and therefore
+the standard CMake variables used to customize the compilation process for C++,
+for example ``CMAKE_CXX_FLAGS``, can be used for HIP as well.
+
+
+Since CMake does not support autodetection of HIP compilers/target architectures
+yet, ``CMAKE_CXX_COMPILER`` must be set to a valid HIP compiler, i.e. ``hipcc`` or ``nvcc``,
+and ``AMReX_AMD_ARCH`` to the target architecture you are building for.
+Thus **AMReX_AMD_ARCH and CMAKE_CXX_COMPILER are required user-inputs when AMReX_GPU_BACKEND=HIP**.
+
+Below is an example configuration for HIP on Tulip:
+
+.. highlight:: console
+
+::
+
+    cmake -DAMReX_GPU_BACKEND=HIP -DCMAKE_CXX_COMPILER=$(which hipcc) -DAMReX_AMD_ARCH="gfx906,gfx908" [other options] /path/to/amrex/source
+
+
+Enabling SYCL support (experimental)
+^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
+
+To build AMReX with SYCL support in CMake, add
+``-DAMReX_GPU_BACKEND=SYCL -DCMAKE_CXX_COMPILER=<sycl-compiler>``
+to the ``cmake`` invocation.
+For a full list of SYCL-specific configuration options,
+check the :ref:`table <tab:cmakesyclvar>` below.
+
+
+In AMReX CMake, the SYCL compiler is treated as a special C++ compiler and therefore
+the standard CMake variables used to customize the compilation process for C++,
+for example ``CMAKE_CXX_FLAGS``, can be used for SYCL as well.
+
+
+Since CMake does not support autodetection of SYCL compilers yet,
+``CMAKE_CXX_COMPILER`` must be set to a valid SYCL compiler, i.e. ``dpcpp``.
+Thus **CMAKE_CXX_COMPILER is a required user-input when AMReX_GPU_BACKEND=SYCL**.
+At this time, **the only supported SYCL compiler is dpcpp**.
+Below is an example configuration for SYCL:
+
+.. highlight:: console
+
+::
+
+    cmake -DAMReX_GPU_BACKEND=SYCL -DCMAKE_CXX_COMPILER=$(which dpcpp) [other options] /path/to/amrex/source
+
+
+.. raw:: latex
+
+   \begin{center}
+
+.. _tab:cmakesyclvar:
+
+.. table:: AMReX SYCL-specific build options
+
+   +------------------------------+-------------------------------------------------+-------------+-----------------+
+   | Variable Name                | Description                                     | Default     | Possible values |
+   +==============================+=================================================+=============+=================+
+   | AMReX_DPCPP_AOT              | Enable DPCPP ahead-of-time compilation          | NO          | YES, NO         |
+   +------------------------------+-------------------------------------------------+-------------+-----------------+
+   | AMReX_DPCPP_SPLIT_KERNEL     | Enable DPCPP kernel splitting                   | YES         | YES, NO         |
+   +------------------------------+-------------------------------------------------+-------------+-----------------+
+.. raw:: latex
+
+   \end{center}
@@ -288,17 +445,17 @@ specific type of GPU memory:
 
 .. table:: Memory Arenas
 
-   +---------------------+------------------+
-   | Arena               | Memory Type      |
-   +=====================+==================+
-   | The_Arena()         | unified memory   |
-   +---------------------+------------------+
-   | The_Device_Arena()  | device memory    |
-   +---------------------+------------------+
-   | The_Managed_Arena() | unified memory   |
-   +---------------------+------------------+
-   | The_Pinned_Arena()  | pinned memory    |
-   +---------------------+------------------+
+   +---------------------+----------------------------+
+   | Arena               | Memory Type                |
+   +=====================+============================+
+   | The_Arena()         | managed or device memory   |
+   +---------------------+----------------------------+
+   | The_Device_Arena()  | device memory              |
+   +---------------------+----------------------------+
+   | The_Managed_Arena() | managed memory             |
+   +---------------------+----------------------------+
+   | The_Pinned_Arena()  | pinned memory              |
+   +---------------------+----------------------------+
 
 .. raw:: latex
 
@@ -315,11 +472,13 @@ to two functions:
     void free (void* p);
 
 :cpp:`The_Arena()` is used for memory allocation of data in
-:cpp:`BaseFab`. Therefore the data in a :cpp:`MultiFab` is placed in
-unified memory and is accessible from both CPU host and GPU device.
+:cpp:`BaseFab`. By default, it allocates managed memory. This can be changed with
+a boolean runtime parameter ``amrex.the_arena_is_managed``.
+Therefore the data in a :cpp:`MultiFab` is placed in
+managed memory by default and is accessible from both CPU host and GPU device.
 This allows application codes to develop their GPU capability
 gradually. :cpp:`The_Managed_Arena()` is a separate pool of
-unified memory, that is distinguished from :cpp:`The_Arena()` for
+managed memory, that is distinguished from :cpp:`The_Arena()` for
 performance reasons. If you want to print out the current memory usage
 of the Arenas, you can call :cpp:`amrex::Arena::PrintUsage()`.
@@ -511,7 +670,7 @@ implementation is reproduced here:
 .. highlight:: c++
 
 ::
-
+
     Real MultiFab::Dot (const MultiFab& x, int xcomp, const MultiFab& y, int ycomp,
                         int numcomp, int nghost, bool local)
     {
@@ -864,9 +1023,9 @@ prepares the device launch based on a :cpp:`Box`, launches with an appropriate s
 GPU kernel and constructs a thread :cpp:`Box` that defines the work for each
 thread. On the CPU, the thread :cpp:`Box` is set equal to the total launch
 :cpp:`Box`, so tiling works as expected. On the GPU, the thread :cpp:`Box` usually
-contains a single cell to allow all GPU threads to be utilized effectively. 
+contains a single cell to allow all GPU threads to be utilized effectively.
 
-An example of a generic function launch is shown here: 
+An example of a generic function launch is shown here:
 
 .. highlight:: c++
 
@@ -1069,24 +1228,17 @@ as:
        and "b; }" as another.
 
        Real a;    <---- OK
-       Real b; 
+       Real b;
    });
 
 Users that choose to implement the macro launches should be aware of the
 limitations of C++ preprocessing macros to ensure GPU offloading is done
 properly.
 
-Finally, AMReX's expected OpenMP strategy for GPUs is to utilize OpenMP
-in CPU regions to maintain multi-threaded parallelism on work that cannot be
-offloaded efficiently, while using CUDA independently in GPU regions.
-This means OpenMP pragmas need to be maintained when ``USE_CUDA=FALSE``
-and turned off in locations CUDA is implemented when ``USE_CUDA=TRUE``.
-
-This can currently be implemented in preparation for an OpenMP strategy and
-users are highly encouraged to do so now. This prevents having to track
-down and label the appropriate OpenMP regions in the future and
-clearly labels for readers that OpenMP and GPUs are not being used at the
-same time. OpenMP pragmas can be turned off using the conditional pragma
-and :cpp:`Gpu::notInLaunchRegion()`, as shown below:
+Finally, AMReX's most common CPU threading strategy for GPU/CPU systems is to utilize
+OpenMP threads to maintain multi-threaded parallelism on work chosen to run on the host.
+This means OpenMP pragmas should be maintained where CPU work is performed and usually
+turned off where work is offloaded onto the GPU. OpenMP pragmas can be turned
+off using the conditional pragma and :cpp:`Gpu::notInLaunchRegion()`, as shown below:
 
 .. highlight:: c++
 
@@ -1096,11 +1248,13 @@ and :cpp:`Gpu::notInLaunchRegion()`, as shown below:
     #pragma omp parallel if (Gpu::notInLaunchRegion())
 #endif
 
-This should be added only to MFIter loops that contain GPU work.
+It is generally expected that launching GPU work from multiple OpenMP threads
+will show little improvement and may even perform worse. So, this conditional statement
+should be added to MFIter loops that contain GPU work, unless users specifically test
+the performance or are designing more complex workflows that require OpenMP.
 
 .. _sec:gpu:example:
 
-
 An Example of Migrating to GPU
 ==============================
 
@@ -1202,20 +1356,20 @@ To help debugging, we often use :cpp:`amrex::Assert` and
However, implementing these functions requires additional GPU registers, which will reduce overall performance. Therefore, it is preferred to implement such calls in debug mode only by wrapping the -calls using ``#ifdef AMREX_DEBUG``. +calls using ``#ifdef AMREX_DEBUG``. In CPU code, :cpp:`AMREX_GPU_ERROR_CHECK()` can be called to check the health of previous GPU launches. This call looks up the return message from the most recently completed GPU launch and aborts if it was not successful. Many kernel -launch macros as well as the :cpp:`MFIter` destructor include a call +launch macros as well as the :cpp:`MFIter` destructor include a call to :cpp:`AMREX_GPU_ERROR_CHECK()`. This prevents additional launches from being called if a previous launch caused an error and ensures all GPU launches within an :cpp:`MFIter` loop completed successfully before continuing work. -However, due to asynchronicity, determining the source of the error -can be difficult. Even if GPU kernels launched earlier in the code +However, due to asynchronicity, determining the source of the error +can be difficult. Even if GPU kernels launched earlier in the code result in a CUDA error, the error may not be output at a nearby call to :cpp:`AMREX_GPU_ERROR_CHECK()` by the CPU. When tracking down a CUDA launch error, :cpp:`Gpu::synchronize()` and @@ -1274,7 +1428,7 @@ to GPUs using Cuda, OpenACC, and OpenMP, please see :cpp:`Tutorials/Particles/El GPU-aware implementations of many common particle operations are provided with AMReX, including neighbor list construction and traversal, particle-mesh deposition and interpolation, parallel reductions of particle data, and a set of transformation and filtering operations that are useful when operating on sets of particles. For -examples of these features in use, please see :cpp:`Tests/Particles/`. +examples of these features in use, please see :cpp:`Tests/Particles/`. Finally, the parallel communication of particle data has been ported and optimized for performance on GPU platforms. This includes :cpp:`Redistribute()`, which moves particles back to the proper grids after their positions @@ -1350,6 +1504,32 @@ AMReX for GPUs: ... } +* Pay attention to what GPUs your job scheduler is assigning to each MPI + rank. In most cases you'll achieve the best performance when a single + MPI rank is assigned to each GPU, and has boxes large enough to saturate + that GPU's compute capacity. While there are some cases where multiple + MPI ranks per GPU can make sense (typically this would be when you have + some portion of your code that is not GPU accelerated and want to have + many MPI ranks to make that part faster), this is probably the minority + of cases. For example, on OLCF Summit you would want to ensure that your + resource sets contain one MPI rank and GPU each, using `jsrun -n N -a 1 -c 7 -g 1`, + where `N` is the total number of MPI ranks/GPUs you want to use. (See the OLCF + [job step viewer](https://jobstepviewer.olcf.ornl.gov/) for more information.) + + Conversely, if you choose to have multiple GPUs visible to each MPI rank, + AMReX will attempt to do the best job it can assigning MPI ranks to GPUs by + doing round robin assignment. This may be suboptimal because this assignment + scheme would not be aware of locality benefits that come from having an MPI + rank be on the same socket as the GPU it is managing. 
+  If you know the hardware
+  layout of the system you're running on, specifically the number of GPUs per
+  socket (``M``) and number of GPUs per node (``N``), you can set the preprocessor
+  defines ``-DAMREX_GPUS_PER_SOCKET=M`` and ``-DAMREX_GPUS_PER_NODE=N``, which are
+  exposed in the GNU Make system through the variables ``GPUS_PER_SOCKET`` and
+  ``GPUS_PER_NODE`` respectively (see an example in ``Tools/GNUMake/sites/Make.olcf``).
+  Then AMReX can ensure that each MPI rank selects a GPU on the same socket as
+  that rank (assuming your MPI implementation supports MPI 3).
+
+
 
 .. ===================================================================
 
 Inputs Parameters
@@ -1401,7 +1581,7 @@ Cuda-specific tests
 
 - Run under ``nvprof -o profile%p.nvvp ./main3d.xxxx`` for a small
   problem and examine page faults using nvvp
-  
+
 - Run under ``cuda-memcheck``
 
 - Run under ``cuda-gdb``
@@ -1409,8 +1589,8 @@ Cuda-specific tests
 
 - Run with ``CUDA_LAUNCH_BLOCKING=1``. This means that only one kernel
   will run at a time. This can help identify if there are race conditions.
-  
-  
+
+
 Limitations
 ===========
diff --git a/Docs/sphinx_documentation/source/GettingStarted.rst b/Docs/sphinx_documentation/source/GettingStarted.rst
index 0b4808849cd..534f798dc27 100644
--- a/Docs/sphinx_documentation/source/GettingStarted.rst
+++ b/Docs/sphinx_documentation/source/GettingStarted.rst
@@ -7,9 +7,8 @@ Downloading the Code
 
 The source code is available at https://github.com/AMReX-Codes/amrex. The
 GitHub repo is our central repo for development. The development branch
-includes the latest state of the code, and it is merged into the master branch
-on a monthly basis. The master branch is considered the release branch. The
-releases are tagged with version number YY.MM (e.g., 17.04). The MM part of the
+includes the latest state of the code, and it is tagged as a release
+on a monthly basis with version number YY.MM (e.g., 17.04). The MM part of the
 version is incremented every month, and the YY part every year. Bug fix
 releases are tagged with YY.MM.patch (e.g., 17.04.1).
diff --git a/Docs/sphinx_documentation/source/GridCreation.rst b/Docs/sphinx_documentation/source/GridCreation.rst
index 0b9a37f41ba..c718e7edacc 100644
--- a/Docs/sphinx_documentation/source/GridCreation.rst
+++ b/Docs/sphinx_documentation/source/GridCreation.rst
@@ -42,21 +42,21 @@ Note that :cpp:`n_cell` must be given as three separate integers, one for each c
 However, :cpp:`max_grid_size` and :cpp:`blocking_factor` can be specified as a single value
 applying to all coordinate directions, or as separate values for each direction.
 
- - if :cpp:`max_grid_size` (or :cpp:`blocking_factor`) is specified as multiple integers then the first
+ - If :cpp:`max_grid_size` (or :cpp:`blocking_factor`) is specified as multiple integers then the first
    integer applies to level 0, the second to level 1, etc. If you don't specify as many integers
   as there are levels, the final value will be used for the remaining levels.
 
- - if different values of :cpp:`max_grid_size` (or :cpp:`blocking_factor`) are wanted for each coordinate direction,
+ - If different values of :cpp:`max_grid_size` (or :cpp:`blocking_factor`) are wanted for each coordinate direction,
    then :cpp:`max_grid_size_x`, :cpp:`max_grid_size_y` and :cpp:`max_grid_size_z`
    (or :cpp:`blocking_factor_x`, :cpp:`blocking_factor_y` and :cpp:`blocking_factor_z`) must be used.
    If you don't specify as many integers as there are levels, the final value will be used for the remaining levels.
 
 Additional notes:
 
- - to create identical grids of a specific size, e.g. of length *m* in each direction,
+ - To create identical grids of a specific size, e.g. of length *m* in each direction,
    then set :cpp:`max_grid_size` = *m* and :cpp:`blocking_factor` = *m*.
 
- - note that :cpp:`max_grid_size` is just an upper bound; with :cpp:`n_cell = 48`
+ - Note that :cpp:`max_grid_size` is just an upper bound; with :cpp:`n_cell = 48`
    and :cpp:`max_grid_size = 32`, we will typically have one grid of length 32 and one of length 16.
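+
+For example, the following inputs (a sketch using the ``amr`` inputs prefix common to
+AmrCore-based applications; the prefix may differ by application) create level-0 grids
+no longer than 32 cells on a side, each a multiple of 16 cells:
+
+.. highlight:: console
+
+::
+
+    amr.n_cell          = 48 48 48   # number of cells at level 0
+    amr.max_grid_size   = 32         # upper bound on grid side length
+    amr.blocking_factor = 16         # each grid side divisible by 16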
 
 The grid creation process at level 0 proceeds as follows (if not using the KD-tree approach):
diff --git a/Docs/sphinx_documentation/source/IO.rst b/Docs/sphinx_documentation/source/IO.rst
index 4bd2b8c6741..8bce21ceb37 100644
--- a/Docs/sphinx_documentation/source/IO.rst
+++ b/Docs/sphinx_documentation/source/IO.rst
@@ -55,7 +55,7 @@ making such strings.
     const std::string& pfname2 = amrex::Concatenate("plt",istep,4);  // plt0258
 
     istep = 1234567;  // Having more than 5 digits is OK.
-    const std::string& pfname3 = amrex::Concatenate("plt",istep);    // plt12344567
+    const std::string& pfname3 = amrex::Concatenate("plt",istep);    // plt1234567
 
 The argument :cpp:`mf` above (:cpp:`MultiFab` for single level and
 :cpp:`Vector` for multi-level) is the data to be written
diff --git a/Docs/sphinx_documentation/source/LinearSolvers.rst b/Docs/sphinx_documentation/source/LinearSolvers.rst
index 9759b7f1904..d205c732cc0 100644
--- a/Docs/sphinx_documentation/source/LinearSolvers.rst
+++ b/Docs/sphinx_documentation/source/LinearSolvers.rst
@@ -81,7 +81,7 @@ one needs to call the member function
 The :cpp:`int amrlev` parameter should be zero for single-level
 solves. For multi-level solves, each level needs to be provided with
-``alpha`` and ``beta``, or ``Sigma``. For composite solves, :cpp:`amrlev` 0 will
+``alpha`` and ``beta``, or ``sigma``. For composite solves, :cpp:`amrlev` 0 will
 mean the lowest level for the solver, which is not necessarily the lowest
 level in the AMR hierarchy. This is so solves can be done on different
 sections of the AMR hierarchy, e.g. on AMR levels 3 to 5.
@@ -238,7 +238,7 @@ There are many parameters that can be set. Here we discuss some commonly
 used ones.
 
 :cpp:`MLLinOp::setVerbose(int)`, :cpp:`MLMG::setVerbose(int)` and
-:cpp:`MLMG:setBottomVerbose(int)` can be control the verbosity of the
+:cpp:`MLMG::setBottomVerbose(int)` control the verbosity of the
 linear operator, multigrid solver and the bottom solver, respectively.
 
 The multigrid solver is an iterative solver. The maximal number of
@@ -266,8 +266,9 @@ operators for the multigrid.
     // out = L(in)
     mlmg.apply(out, in);  // here both in and out are const Vector&
 
-At the bottom of the multigrid cycles, we use the biconjugate gradient
-stabilized method as the bottom solver. :cpp:`MLMG` member method
+At the bottom of the multigrid cycles, we use a ``bottom solver`` which may be
+different from the relaxation used at the other levels. The default bottom solver is the
+biconjugate gradient stabilized method, but it can easily be changed with the :cpp:`MLMG` member method
 
 .. highlight:: c++
 
@@ -275,7 +276,7 @@ stabilized method as the bottom solver. :cpp:`MLMG` member method
 
     void setBottomSolver (BottomSolver s);
 
-can be used to change the bottom solver. Available choices are
+Available choices are
 
 - :cpp:`MLMG::BottomSolver::bicgstab`: The default.
 
@@ -290,10 +291,32 @@ can be used to change the bottom solver. Available choices are
 - :cpp:`MLMG::BottomSolver::cgbicg`: Start with cg. Switch to bicgstab if cg fails.
   The matrix must be symmetric.
 
-- :cpp:`MLMG::BottomSolver::hypre`: BoomerAMG in hypre.
+- :cpp:`MLMG::BottomSolver::hypre`: One of the solvers available through hypre; see
+  the section below on External Solvers.
 
 - :cpp:`MLMG::BottomSolver::petsc`: Currently for cell-centered only.
 
+Boundary Stencils for Cell-Centered Solvers
+===========================================
+
+We have the option of using the :cpp:`MLMG` member method
+
+.. highlight:: c++
+
+::
+
+    void setMaxOrder (int maxorder);
+
+to set the order of the cell-centered linear operator stencil at physical boundaries
+with Dirichlet boundary conditions and at coarse-fine boundaries. In both of these
+cases, the boundary value is not defined at the center of the ghost cell.
+The order determines the number of interior cells that are used in the extrapolation
+of the boundary value from the cell face to the center of the ghost cell, where
+the extrapolated value is then used in the regular stencil. For example,
+:cpp:`maxorder = 2` uses the boundary value and the first interior value to extrapolate
+to the ghost cell center; :cpp:`maxorder = 3` uses the boundary value and the first two interior values.
+
+
 Curvilinear Coordinates
 =======================
@@ -382,23 +405,106 @@ as living at face centroids, modify the setBCoeffs command to be
 
 External Solvers
 ================
 
-AMReX can use the `hypre `_ algebraic multigrid solver, BoomerAMG,
-as a bottom solver for both cell-centered and node-based problems.
-For challenging problems, our geometric multigrid solver may have difficulty solving,
-whereas an algebraic multigrid method might be more robust.
-We note that by default our solver always tries to geometrically coarsen the
+AMReX provides interfaces to the `hypre <https://github.com/hypre-space/hypre>`_ preconditioners and solvers, including BoomerAMG, GMRES (all variants), PCG, and BICGStab as
+solvers, and BoomerAMG and Euclid as preconditioners. These can be called
+as bottom solvers for both cell-centered and node-based problems.
+
+By default the AMReX linear solver code always tries to geometrically coarsen the
 problem as much as possible. However, as we have mentioned, we
 can call :cpp:`setMaxCoarseningLevel(0)` on the :cpp:`LPInfo`
 object passed to the constructor of a linear operator to disable
 the coarsening completely. In that case the bottom solver is solving the
-residual correction form of the original problem.
+residual correction form of the original problem. To build hypre, follow these steps:
+
+.. highlight:: console
+
+::
+
+    1.- git clone https://github.com/hypre-space/hypre.git
+    2.- cd hypre/src
+    3.- ./configure
+        (if you want to build hypre with long long int, do ./configure --enable-bigint )
+    4.- make install
+    5.- Create an environment variable with the HYPRE directory --
+        HYPRE_DIR=/hypre_path/hypre/src/hypre
 
 To use hypre, one must include ``amrex/Src/Extern/HYPRE`` in the build system.
-For an example of using hypre, we refer the reader to
-``Tutorials/LinearSolvers/ABecLaplacian_C``.
+For examples of using hypre, we refer the reader to
+``Tutorials/LinearSolvers/ABecLaplacian_C`` or ``Tutorials/LinearSolvers/NodalProjection_EB``.
+
+Caveat: to use hypre for the nodal solver, you must either build with USE_EB = TRUE,
+or explicitly set the coarsening strategy in the calling routine to be ``RAP`` rather than ``Sigma``
+by adding
+
+.. highlight:: c++
+
+::
+
+    nodal_projector.getLinOp().setCoarseningStrategy(MLNodeLaplacian::CoarseningStrategy::RAP);
+
+where
+:cpp:`nodal_projector` is the :cpp:`NodalProjector` object we have built.
+
+The following parameter should be set to True if the problem to be solved has a singular matrix.
+In this case, the solution is only defined to within a constant. Setting this parameter to True
+replaces one row in the matrix sent to hypre from AMReX by a row that sets the value at one cell to 0.
+
+- :cpp:`hypre.adjust_singular_matrix`: Default is False.
+
+
+The following parameters can be set in the inputs file to control the choice of preconditioner and smoother:
+
+- :cpp:`hypre.hypre_solver`: Default is BoomerAMG.
+
+- :cpp:`hypre.hypre_preconditioner`: Default is none; otherwise the type must be specified.
+
+- :cpp:`hypre.recompute_preconditioner`: Default true. Option to recompute the preconditioner.
+
+- :cpp:`hypre.write_matrix_files`: Default false. Option to write out matrix into text files.
+
+- :cpp:`hypre.overwrite_existing_matrix_files`: Default false. Option to over-write existing matrix files.
+
+
+The following parameters can be set in the inputs file to control the BoomerAMG solver specifically:
+
+- :cpp:`hypre.bamg_verbose`: Verbosity of the BoomerAMG preconditioner. Default 0. See `HYPRE_BoomerAMGSetPrintLevel`
+
+- :cpp:`hypre.bamg_logging`: Default 0. See `HYPRE_BoomerAMGSetLogging`
+
+- :cpp:`hypre.bamg_coarsen_type`: Default 6. See `HYPRE_BoomerAMGSetCoarsenType`
+
+- :cpp:`hypre.bamg_cycle_type`: Default 1. See `HYPRE_BoomerAMGSetCycleType`
+
+- :cpp:`hypre.bamg_relax_type`: Default 6. See `HYPRE_BoomerAMGSetRelaxType`
+
+- :cpp:`hypre.bamg_relax_order`: Default 1. See `HYPRE_BoomerAMGSetRelaxOrder`
+
+- :cpp:`hypre.bamg_num_sweeps`: Default 2. See `HYPRE_BoomerAMGSetNumSweeps`
+
+- :cpp:`hypre.bamg_max_levels`: Default 20. See `HYPRE_BoomerAMGSetMaxLevels`
+
+- :cpp:`hypre.bamg_strong_threshold`: Default 0.25 for 2D, 0.57 for 3D. See `HYPRE_BoomerAMGSetStrongThreshold`
+
+- :cpp:`hypre.bamg_interp_type`: Default 0. See `HYPRE_BoomerAMGSetInterpType`
+
+The user is referred to the
+`hypre Reference Manual <https://hypre.readthedocs.io/>`_ for full details on the usage of the parameters described briefly above.
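+
+For instance, a run using GMRES preconditioned with BoomerAMG as the hypre bottom
+solver might add the following to its inputs file (a sketch; the accepted solver and
+preconditioner names depend on the hypre interface being used):
+
+.. highlight:: console
+
+::
+
+    hypre.hypre_solver         = GMRES
+    hypre.hypre_preconditioner = BoomerAMG
+    hypre.bamg_verbose         = 1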
 
 AMReX can also use `PETSc `_ as a bottom solver for cell-centered
-problems. To use PETSc, one must include ``amrex/Src/Extern/PETSc``
+problems. To build PETSc, follow these steps:
+
+.. highlight:: console
+
+::
+
+    1.- git clone https://github.com/petsc/petsc.git
+    2.- cd petsc
+    3.- ./configure --download-hypre=yes --prefix=build_dir
+    4.- Follow the steps given by PETSc
+    5.- Create an environment variable with the PETSC directory --
+        PETSC_DIR=/petsc_path/petsc/build_dir
+
+To use PETSc, one must include ``amrex/Src/Extern/PETSc``
 in the build system. For an example of using PETSc, we refer the reader to
 ``Tutorials/LinearSolvers/ABecLaplacian_C``.
@@ -508,7 +614,7 @@ the MACProjector object and use it to perform a MAC projection.
                                           LinOpBCType::Periodic)});
 
     macproj.setVerbose(mg_verbose);
-    macproj.setCGVerbose(cg_verbose);
+    macproj.setBottomVerbose(bottom_verbose);
 
     // Define the relative tolerance
     Real reltol = 1.e-8;
@@ -665,10 +771,10 @@ gradient term to make the vector field result satisfy the divergence
 constraint.
 
     // We can specify the maximum number of iterations
     nodal_solver.setMaxIter(mg_maxiter);
-    nodal_solver.setCGMaxIter(mg_cg_maxiter);
+    nodal_solver.setBottomMaxIter(mg_bottom_maxiter);
 
     nodal_solver.setVerbose(mg_verbose);
-    nodal_solver.setCGVerbose(mg_cg_verbose);
+    nodal_solver.setBottomVerbose(mg_bottom_verbose);
 
     // Set bottom-solver to use hypre instead of native BiCGStab
     // ( we could also have set this to cg, bicgcg, cgbicg)
diff --git a/Docs/sphinx_documentation/source/LoadBalancing.rst b/Docs/sphinx_documentation/source/LoadBalancing.rst
index 85c6a17cec8..fa384ea1659 100644
--- a/Docs/sphinx_documentation/source/LoadBalancing.rst
+++ b/Docs/sphinx_documentation/source/LoadBalancing.rst
@@ -16,16 +16,41 @@ grid creation process is governed by trying to balance the work in each grid.)
 
 Single-level load balancing algorithms are sequentially applied to each AMR level independently,
 and the resulting distributions are mapped onto the ranks taking into account the weights
-already assigned to them (assign heaviest set of grids to the least loaded rank)
+already assigned to them (assign heaviest set of grids to the least loaded rank). Note that the
+load of each process is measured by how much memory has already been allocated, not how much memory
+will be allocated. Therefore the following code is not recommended because it tends to generate
+non-optimal distributions.
 
-Options supported by AMReX include the following; the default is SFC:
+.. highlight:: c++
+
+::
+
+    for (int lev = 0; lev < nlevels; ++lev) {
+        // build DistributionMapping for Level lev
+    }
+    for (int lev = 0; lev < nlevels; ++lev) {
+        // build MultiFabs for Level lev
+    }
+
+Instead, one should do:
+
+.. highlight:: c++
+
+::
+
+    for (int lev = 0; lev < nlevels; ++lev) {
+        // build DistributionMapping for Level lev
+        // build MultiFabs for Level lev
+    }
+
+Distribution options supported by AMReX include the following; the default is SFC:
 
 - Knapsack: the default weight of a grid in the knapsack algorithm is the number of grid cells,
   but AMReX supports the option to pass an array of weights -- one per grid -- or alternatively
-  to pass in a MultiFab of weights per cell which is used to compute the weight per grid
+  to pass in a MultiFab of weights per cell which is used to compute the weight per grid.
 
 - SFC: enumerate grids with a space-filling Z-morton curve, then partition the
-  resulting ordering across ranks in a way that balances the load
+  resulting ordering across ranks in a way that balances the load.
 
 - Round-robin: sort grids and assign them to ranks in round-robin fashion -- specifically
   FAB i is owned by CPU i%N where N is the total number of MPI ranks.
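+
+The distribution strategy can also be selected at run time via the inputs file
+(a sketch using the standard ``DistributionMapping`` inputs names):
+
+.. highlight:: console
+
+::
+
+    DistributionMapping.strategy = KNAPSACK   # or SFC, ROUNDROBIN
+    DistributionMapping.verbose  = 1          # print distribution statistics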
diff --git a/Docs/sphinx_documentation/source/Particle.rst b/Docs/sphinx_documentation/source/Particle.rst
index 25c82cf223d..4d9746242b2 100644
--- a/Docs/sphinx_documentation/source/Particle.rst
+++ b/Docs/sphinx_documentation/source/Particle.rst
@@ -371,8 +371,8 @@ skipped. You can also access the SoA data using the :math:`ParIter` as follows:
     using MyParIter = ParIter<0, 0, 2, 2>;
     for (MyParIter pti(pc, lev); pti.isValid(); ++pti) {
         auto& particle_attributes = pti.GetStructOfArrays();
-        Vector<Real>& real_comp0 = particle_attributes.GetRealData(0);
-        Vector<int>&  int_comp1  = particle_attributes.GetIntData(1);
+        RealVector& real_comp0 = particle_attributes.GetRealData(0);
+        IntVector&  int_comp1  = particle_attributes.GetIntData(1);
         for (int i = 0; i < pti.numParticles; ++i) {
             // do stuff with your SoA data...
         }
@@ -434,7 +434,7 @@ both these sorts of operations.
 
     Ey.FillBoundary(gm.periodicity());
     Ez.FillBoundary(gm.periodicity());
     for (MyParIter pti(MyPC, lev); pti.isValid(); ++pti) {
-        const Box& box = Ex[pti].validBox();
+        const Box& box = pti.validbox();
 
         const auto& particles = pti.GetArrayOfStructs();
         int nstride = particles.dataShape().first;
@@ -474,7 +474,7 @@ is quite similar:
 
     rho.setVal(0.0, ng);
     for (MyParIter pti(*this, lev); pti.isValid(); ++pti) {
-        const Box& box = rho[pti].validbox();
+        const Box& box = pti.validbox();
 
         const auto& particles = pti.GetArrayOfStructs();
         int nstride = particles.dataShape().first;
diff --git a/Docs/sphinx_documentation/source/SUNDIALS.rst b/Docs/sphinx_documentation/source/SUNDIALS.rst
new file mode 100644
index 00000000000..420002ec178
--- /dev/null
+++ b/Docs/sphinx_documentation/source/SUNDIALS.rst
@@ -0,0 +1,78 @@
+.. role:: cpp(code)
+   :language: c++
+
+.. role:: fortran(code)
+   :language: fortran
+
+
+Compiling AMReX with SUNDIALS 5
+===============================
+
+The following steps describe how to compile an AMReX application with
+SUNDIALS 5 support.
+
+In order to use SUNDIALS:
+
+#. AMReX suggests using the Github mirror:
+   https://github.com/LLNL/sundials
+
+   ::
+
+      #!/bin/bash
+      set -e
+      git clone https://github.com/LLNL/sundials
+      cd sundials
+      mkdir builddir instdir
+      INSTALL_PREFIX=$(pwd)/instdir
+      cd builddir
+      cmake \
+          -DCMAKE_INSTALL_PREFIX=${INSTALL_PREFIX} \
+          -DCMAKE_INSTALL_LIBDIR=lib \
+          -DCMAKE_VERBOSE_MAKEFILE:BOOL=ON \
+          -DCMAKE_C_COMPILER=$(which gcc) \
+          -DCMAKE_CXX_COMPILER=$(which g++) \
+          -DCMAKE_CUDA_HOST_COMPILER=$(which g++) \
+          -DEXAMPLES_INSTALL_PATH=${INSTALL_PREFIX}/examples \
+          -DCMAKE_BUILD_TYPE=Release \
+          -DCMAKE_C_FLAGS_RELEASE="-O3 -DNDEBUG" \
+          -DCMAKE_CXX_FLAGS_RELEASE="-O3 -DNDEBUG" \
+          -DCUDA_ENABLE=ON \
+          -DMPI_ENABLE=OFF \
+          -DOPENMP_ENABLE=ON \
+          -DF2003_INTERFACE_ENABLE=ON \
+          -DCUDA_ARCH=sm_70 ../
+      make -j8
+      make install -j8
+
+#. Note that ``CMAKE_C_COMPILER`` and ``CMAKE_CXX_COMPILER`` need to be consistent with the AMReX
+   make variable ``COMP`` to ensure matching OMP runtime libraries for use with the OpenMP NVector.
+
+#. ``CUDA_ARCH`` must be set to the appropriate value for the GPU being targeted.
+
+#. For more detailed instructions for installing SUNDIALS with different flags and versions see
+   the `SUNDIALS documentation <https://computing.llnl.gov/projects/sundials>`_.
+
+#. In the ``GNUmakefile`` for the application which uses the interface to SUNDIALS, add
+   ``USE_SUNDIALS = TRUE`` and ``SUNDIALS_ROOT=${INSTALL_PREFIX}``. Note that one must define the
+   ``SUNDIALS_LIB_DIR`` make variable to point to the location where the libraries are installed
+   if they are not installed in the default location which is ``${INSTALL_PREFIX}/lib64``.
+
+#. If the application uses the SUNDIALS CVODE time integrator package, then the variable
+   ``USE_CVODE_LIBS = TRUE`` should also be added in the ``GNUmakefile`` for the application.
+   If the application uses the SUNDIALS ARKode time integrator package, then the variable
+   ``USE_ARKODE_LIBS = TRUE`` should be added.
+
+#. Fortran 2003 interfaces for the pgi compilers are currently not supported.
+
+
+Note that SUNDIALS can also be installed via Spack:
+
+   ::
+
+      spack install sundials+cuda+f2003+openmp
+
+
+SUNDIALS 5 Tutorials
+--------------------------
+
+AMReX provides SUNDIALS tutorials in the ``amrex/Tutorials/SUNDIALS`` directory.
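+
+For reference, a minimal ``GNUmakefile`` fragment for one of these tutorials, using the
+CVODE interface, might contain (a sketch; the install path is a placeholder):
+
+   ::
+
+      USE_SUNDIALS     = TRUE
+      USE_CVODE_LIBS   = TRUE
+      SUNDIALS_ROOT    = /path/to/sundials/instdir
+      # Needed only if the libraries are not in the default ${SUNDIALS_ROOT}/lib64
+      SUNDIALS_LIB_DIR = ${SUNDIALS_ROOT}/lib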
diff --git a/Docs/sphinx_documentation/source/SUNDIALS3.rst b/Docs/sphinx_documentation/source/SUNDIALS3.rst deleted file mode 100644 index 073e6bc3427..00000000000 --- a/Docs/sphinx_documentation/source/SUNDIALS3.rst +++ /dev/null @@ -1,98 +0,0 @@ -.. role:: cpp(code) - :language: c++ - -.. role:: fortran(code) - :language: fortran - - -Compiling AMReX with Sundials version 3.X or later ---------------------------------------------------- - -The following steps describe how to compile an AMReX application with -SUNDIALS_3.X support. On Cray systems (e.g., Cori or Edison at NERSC), Cray provides -a system module called ``cray-tpsl`` ("Cray Third-Party Scientific Libraries") -which as of this writing contains the 2.7 version of the SUNDIALS solver suite (including -CVODE). - -In order to use the Sundials 3.X version: - -#. Obtain the CVODE source code, which is hosted here: - https://computation.llnl.gov/projects/sundials/sundials-software. - One can download either the complete SUNDIALS package, or just the CVODE components. - -#. Unpack the CVODE / SUNDIALS tarball, and create a new "build" directory (it - can be anywhere). - -#. Navigate to the new, empty build directory, and type - - :: - - cmake \ - -DCMAKE_INSTALL_PREFIX:PATH=/path/to/install/dir \ - /path/to/cvode/or/sundials/top/level/source/dir - - - The ``CMAKE_INSTALL_DIR`` option tells CMake where to install the libraries. - Note that CMake will attempt to deduce the compilers automatically, but - respects certain environment variables if they are defined, such as ``CC`` - (for the C compiler), ``CXX`` (for the C++ compiler), and ``FC`` (for the - Fortran compiler). So one may modify the above CMake invocation to be - something like the following: - - :: - - CC=/path/to/gcc \ - CXX=/path/to/g++ \ - FC=/path/to/gfortran \ - cmake \ - -DCMAKE_INSTALL_PREFIX:PATH=/path/to/install/dir \ - /path/to/cvode/or/sundials/top/level/source/dir - - - One can supply additional flags to CMake or to the compiler to customize the - compilation process. Flags of interest may include ``CMAKE_C_FLAGS``, which - add the specified flags to the compile statement, e.g., - ``-DCMAKE_C_FLAGS="-h list=a"`` will append the ``-h list=a`` flag to the - ``cc`` statement when compiling the source code. Here one may wish to add - something like ``"-O2 -g"`` to provide an optimized library that still - contains debugging symbols; if one neglects debugging symbols in the CVODE - library, and if a code that uses CVODE encounters a segmentation fault in - the solve, then the backtrace has no information about where in the solver - the error occurred. Also, if one wishes to compile only the solver library - itself and not the examples that come with the source (compiling the - examples is enabled by default), one can add ``"-DEXAMPLES_ENABLE=OFF"``. - Users should be aware that the CVODE examples are linked dynamically, so - when compiling the solver library on Cray system using the Cray compiler - wrappers ``cc``, ``CC``, and ``ftn``, one should explicitly disable - compiling the examples via the ``"-DEXAMPLES_ENABLE=OFF"`` flag. - -#. In the ``GNUmakefile`` for the application which uses the Fortran 2003 - interface to CVODE or ARKODE, add ``SUNDIALS_3x4x = TRUE``, which will compile the Fortran 2003 - interfaces and link the libraries. Note that one must define the - ``CVODE_LIB_DIR`` environment variable to point to the location where the - libraries are installed. - -#. 
In the ``GNUmakefile`` for the application which uses the Fortran 2003
-   interface to ARKODE, also add ``USE_ARKODE_LIBS = TRUE``. It is assumed that the
-   ``CVODE_LIB_DIR`` environment variable points to the location where the ARKODE
-   libraries are installed as well.
-
-#. Fortran 2003 interfaces for the pgi compilers and for developmental versions of SUNDIALS
-   are currently not supported.
-
-SUNDIALS 3.X Tutorials
--------------------------
-
-AMReX provides six tutorials in the ``amrex/Tutorials/CVODE/SUNDIALS3_finterface`` directory.
-``EX1`` is modeled after the CVODE Tutorial ``EX1`` showing use with AMReX.
-The four ``EX_cv_*`` tutorials are based on examples provided with the interface, which
-are more closely modeled after CVODE examples. The ``EX_ark_analytic_fp`` tutorial is based
-on the ``EX_cv_analytic_fp`` tutorial, but uses ARKODE instead of CVODE.
-
-AMReX provides three tutorials in the ``amrex/Tutorials/CVODE/SUNDIALS3_cppversion`` directory.
-These are versions of ``EX1`` which operate on a packed version of the data. ``EX1_SERIAL_NVEC``
-packs a box worth of equations into a serial NVector, uses CVODE to solve, and then unpacks
-the solution back into the box it came from. ``EX1_CUDA_NVEC`` uses the cuda NVector implementation instead.
-``EX1_GPU_PRAGMA`` uses the cuda NVector, and the gpu pragma functionality.
-
-.. _SUNDIALS3:
diff --git a/Docs/sphinx_documentation/source/CVODE.rst b/Docs/sphinx_documentation/source/SUNDIALS_CVODE.rst
similarity index 95%
rename from Docs/sphinx_documentation/source/CVODE.rst
rename to Docs/sphinx_documentation/source/SUNDIALS_CVODE.rst
index 3f90028401e..eb38fe608b1 100644
--- a/Docs/sphinx_documentation/source/CVODE.rst
+++ b/Docs/sphinx_documentation/source/SUNDIALS_CVODE.rst
@@ -5,8 +5,8 @@
    :language: fortran
 
 
-Compiling AMReX with CVODE (Cray or Sundials version 2.7)
------------------------------------------------------------
+Compiling AMReX with CVODE 2.7
+==============================
 
 The following steps describe how to compile an AMReX application with
 CVODE support. On Cray systems (e.g., Cori or Edison at NERSC), Cray provides
@@ -73,8 +73,9 @@ On systems which are not Cray:
    ``CVODE_LIB_DIR`` environment variable to point to the location where the
    libraries are installed.
 
-CVODE Tutorials
-------------------
+
+CVODE 2.7 Tutorials
+-------------------
 
 AMReX provides two CVODE tutorials in the ``amrex/Tutorials/CVODE`` directory,
 called ``EX1`` and ``EX2``. See the Tutorials CVODE_ documentation for more detail.
diff --git a/Docs/sphinx_documentation/source/SUNDIALS_top.rst b/Docs/sphinx_documentation/source/SUNDIALS_top.rst
new file mode 100644
index 00000000000..9eaa3b596d3
--- /dev/null
+++ b/Docs/sphinx_documentation/source/SUNDIALS_top.rst
@@ -0,0 +1,36 @@
+.. _Chap:SUNDIALS:
+
+SUNDIALS
+========
+
+AMReX supports local ODE integration using the ARKode [1]_ and CVODE [2]_
+time integrators which are part of the SUNDIALS framework [3]_. ARKode
+and CVODE contain solvers for stiff and non-stiff ODEs, and as such they
+are well suited for solving, e.g., the complex chemistry networks in combustion
+simulations, or the nuclear reaction networks in astrophysical simulations.
+
+Most of SUNDIALS is written in C, but it is distributed with Fortran
+interfaces that use the ``iso_c_binding`` feature of the Fortran 2003 standard.
+AMReX supports these Fortran 2003 interfaces and they are used in the AMReX
+SUNDIALS 5 tutorials.
+
+AMReX currently supports SUNDIALS version 5 and, for CVODE only, a legacy
+interface to SUNDIALS 2.7, the version provided by the ``cray-tpsl``
+system module on Cray systems.
+
+
+.. toctree::
+   :maxdepth: 2
+
+   SUNDIALS
+   SUNDIALS_CVODE
+
+.. [1]
+   https://computation.llnl.gov/projects/sundials/arkode
+
+.. [2]
+   https://computation.llnl.gov/projects/sundials/cvode
+
+.. [3]
+   https://computation.llnl.gov/projects/sundials
+
diff --git a/Docs/sphinx_documentation/source/Testing.rst b/Docs/sphinx_documentation/source/Testing.rst
index e2994931010..58ee2420a7d 100644
--- a/Docs/sphinx_documentation/source/Testing.rst
+++ b/Docs/sphinx_documentation/source/Testing.rst
@@ -119,6 +119,6 @@ do is start from an existing test and modify it. For example, this entry:
 defines a test called :cpp:`MLMG_FI_PoisCom` by specifying the apppropriate
 build directory, inputs file, and a set of configuration options.
 The above options are the most commonly changed; for a full list
-of options, see the example configuration file at https://github.com/AMReX-Codes/regression_testing/blob/master/example-tests.ini.
+of options, see the example configuration file at https://github.com/AMReX-Codes/regression_testing/blob/main/example-tests.ini.

diff --git a/Docs/sphinx_documentation/source/Visualization.rst b/Docs/sphinx_documentation/source/Visualization.rst
index c87d4a8e848..56c9982d8e3 100644
--- a/Docs/sphinx_documentation/source/Visualization.rst
+++ b/Docs/sphinx_documentation/source/Visualization.rst
@@ -755,7 +755,7 @@ and point to the CMake configuration installed with SENSEI.

 .. code-block:: bash

-    cmake -DENABLE_SENSEI=ON -DSENSEI_DIR=/lib/cmake ..
+    cmake -DAMReX_SENSEI=ON -DSENSEI_DIR=/lib/cmake ..

 When CMake generates the make files proceed as usual.
diff --git a/Docs/sphinx_documentation/source/index.rst b/Docs/sphinx_documentation/source/index.rst
index a7247a8ab23..3ec3e895474 100644
--- a/Docs/sphinx_documentation/source/index.rst
+++ b/Docs/sphinx_documentation/source/index.rst
@@ -12,8 +12,8 @@ AMReX is developed at LBNL, NREL, and ANL as part of the Block-Structured AMR
 Co-Design Center in DOE's Exascale Computing Project.

 All of AMReX's development is done in the github repository under the
-development branch; anyone can see the latest updates. Changes are merged into
-the master branch at the beginning of each month.
+development branch; anyone can see the latest updates. A release is tagged at
+the beginning of each month.

 We are always happy to have users contribute to the AMReX source code. To
 contribute, issue a pull request against the development branch (details `here
@@ -42,7 +42,6 @@ Documentation on migration from BoxLib is available in the AMReX repository at D
    ManagingGridHierarchy_Chapter
    AmrCore_Chapter
    AmrLevel_Chapter
-   AsyncIter_Chapter
    ForkJoin
    IO_Chapter
    LinearSolvers_Chapter
diff --git a/Docs/sphinx_tutorials/source/AMR_Tutorial.rst b/Docs/sphinx_tutorials/source/AMR_Tutorial.rst
index aa50376ca25..dfdecaec29b 100644
--- a/Docs/sphinx_tutorials/source/AMR_Tutorial.rst
+++ b/Docs/sphinx_tutorials/source/AMR_Tutorial.rst
@@ -17,8 +17,11 @@ or with VisIt.

 Advection_AmrCore: This tutorial contains an AMR advection code that advects a
 single scalar field with a velocity field that is specified on faces.
+It is written entirely in C++, can be built in 2D or 3D, and run with the same
+inputs file.

-It is an AMReX based code designed to run in parallel using MPI/OMP.
+It is an AMReX-based code designed to run in parallel using MPI+X, where X +may be OMP for multicore machines and CUDA for hybrid CPU/GPU architectures. This example uses source code from the amrex/Src/Base, Boundary, and AmrCore directories. @@ -26,7 +29,7 @@ directories. Notably, this example does not use source code from amrex/Src/Amr (see the tutorial Advection_AmrLevel). -The directory Exec/SingleVortex includes a makefile and a sample inputs file. +The directory Exec includes a makefile and a sample inputs file. **Advection_AmrLevel** ---------------------- diff --git a/Docs/sphinx_tutorials/source/CVODE_Tutorial.rst b/Docs/sphinx_tutorials/source/CVODE_Tutorial.rst index 0599d937e35..4d511f8a1bc 100644 --- a/Docs/sphinx_tutorials/source/CVODE_Tutorial.rst +++ b/Docs/sphinx_tutorials/source/CVODE_Tutorial.rst @@ -8,15 +8,15 @@ Tutorials/CVODE ========================== There are two CVODE tutorials in the ``amrex/Tutorials/CVODE`` directory, called -``EX1`` and ``EX2``. ``EX1`` consists of a single ODE that is integrated with +``EX1_F`` and ``EX2_F``. ``EX1_F`` consists of a single ODE that is integrated with CVODE within each cell of a 3-D grid. It demonstrates how to initialize the CVODE solver, how to call the ODE right-hand-side (RHS), and, more importantly, how to *re-*\ initialize the solver between cells, which avoids allocating and freeing solver memory between each cell (see the call to ``FCVReInit()`` in the -``integrate_ode.f90`` file in the ``EX1`` directory.) +``integrate_ode.f90`` file in the ``EX1_F`` directory.) -The ``EX2`` example demonstrates the slightly more complicated case of -integrating a system of coupled ODEs within each cell. Similarly to ``EX1``, +The ``EX2_F`` example demonstrates the slightly more complicated case of +integrating a system of coupled ODEs within each cell. Similarly to ``EX1_F``, it provides an RHS and some solver initialization. However, it also demonstrates the performance effect of providing an analytic Jacobian matrix for the system of ODEs, rather than requiring the solver to compute the diff --git a/Docs/sphinx_tutorials/source/SENSEI_Tutorial.rst b/Docs/sphinx_tutorials/source/SENSEI_Tutorial.rst deleted file mode 100644 index e74ce4c87d1..00000000000 --- a/Docs/sphinx_tutorials/source/SENSEI_Tutorial.rst +++ /dev/null @@ -1,215 +0,0 @@ -.. role:: cpp(code) - :language: c++ - -.. role:: fortran(code) - :language: fortran - -Tutorials/SENSEI -========================== - -SENSEI is a middleware that allows one to send data to various visualization and -analysis back ends through a uniform interface. It's data model and API enable -one to chose the desired visualization and analysis back end for a given task -with out limitting ones options, as the back ends can be inter-changed at run -time via a text based config file. - -Configuring the environment at NERSC ------------------------------------- - -First select the desired SENSEI install. Each install will support different set of -backends. This is necessary because not all of the back ends are compatible with -each other. - -For instance to use SENSEI with ParaView Catalyst: - -.. highlight:: shell - -:: - - module load sensei/2.1.0-catalyst - - -To use SENSEI with VisIt Libsim: - -.. highlight:: shell - -:: - - - module load sensei/2.1.0-libsim - - -SENSEI features in AMReX are conditionally compiled when the Make file variable -``USE_SENSEI_INSITU`` is set. 
When this variable is set, the Make file will query -environment variables to determine the list of include directories and link -libraries needed to compile with SENSEI. - -The ``sensei_config`` tool that is installed with SENSEI will set the environment -variables that are used in the make files. - -With a SENSEI module loaded, in a bash shell: - -.. highlight:: shell - -:: - - - source sensei_config - - -There are two SENSEI tutorials included with AMReX, for for use with ``AmrCore``, and one -for ``AmrLevel``. - - -Compiling and Running the ``Advection_AmrCore`` tutorial --------------------------------------------------------- - -This example uses source code from the amrex/Src/Base, Boundary, and AmrCore directories. -Notably, this example does not use source code from amrex/Src/Amr -(see the tutorial Advection_AmrLevel). - -The directory Exec/SingleVortex in Tutorials/SENSEI/Advection_AmrCore -includes a makefile and a sample inputs file. -Plotfiles are generated that can be viewed with amrvis2d / amrvis3d -(CCSE's native vis / spreadsheet tool, downloadable separately from ccse.lbl.gov) -or with VisIt. - - -Edit the file ``Exec/SingleVortex/GNUmakefile``, set - -.. highlight:: shell - -:: - - - USE_SENSEI_INSITU = TRUE - - -Build the tutorial - -.. highlight:: shell - -:: - - - make -j4 - - -To use SENSEI in AMReX one needs to enable it via ParmParse input file. -Additionally one needs to provide a SENSEI XML configuration that selects -and configures the desired SENSEI backend. - -Example XML configs are included in ``Exec/SingleVortex/SENSEI``. - -Edit the file ``Exec/SingleVortex/inputs`` - -Running with ParaView Catalyst: - -.. highlight:: shell - -:: - - - sensei.enabled = 1 # turn SENSEI in situ on/off - sensei.config = SENSEI/render_catalyst.xml # render simulation data with ParaView Catalyst - sensei.frequency = 1 # number of level 0 steps between in situ processing - - -Running with VisIt Libsim: - -.. highlight:: shell - -:: - - - sensei.enabled = 1 # turn SENSEI in situ on/off - sensei.config = SENSEI/render_libsim.xml # render simulation data with VisIt Libsim - sensei.frequency = 1 # number of level 0 steps between in situ processing - - -Once the inputs files has been edited, run the execcutable as usual - -.. highlight:: shell - -:: - - - mpiexec -np 4 ./main2d.gnu.MPI.ex inputs - - - -Compiling and Running the ``Advection_AmrLevel`` tutorial ---------------------------------------------------------- - -This example uses source code from the amrex/Src/Base, Boundary, Amrlevel, and -Amr directories. - -The directories Exec/SingleVortex and Exec/UniformVelocity in Tutorials/SENSEI/Advection_AmrLevel -each include a makefile and a sample inputs file. -Plotfiles are generated that can be viewed with amrvis2d / amrvis3d -(CCSE's native vis / spreadsheet tool, downloadable separately from ccse.lbl.gov) -or with VisIt. - -Edit the file ``Exec/SingleVortex/GNUmakefile``, set - -.. highlight:: shell - -:: - - - USE_SENSEI_INSITU = TRUE - - -Finally, make the tutorial - -.. highlight:: shell - -:: - - - make -j4 - - -## Running ## -To use SENSEI in AMReX one needs to enable it via ParmParse input file. -Additionally one needs to provide a SENSEI XML configuration that selects -and configures the desired SENSEI backend. - -Example XML configs are included in ``Exec/SingleVortex/SENSEI``. - -Edit the file ``Exec/SingleVortex/inputs`` - - -Running with ParaView Catalyst: - -.. 
highlight:: shell
-
-::
-
-
-    sensei.enabled = 1                          # turn SENSEI in situ on/off
-    sensei.config = SENSEI/render_catalyst.xml  # render simulation data with ParaView Catalyst
-    sensei.frequency = 1                        # number of level 0 steps between in situ processing
-
-
-Running with VisIt Libsim:
-
-.. highlight:: shell
-
-::
-
-
-    sensei.enabled = 1                        # turn SENSEI in situ on/off
-    sensei.config = SENSEI/render_libsim.xml  # render simulation data with VisIt Libsim
-    sensei.frequency = 1                      # number of level 0 steps between in situ processing
-
-
-Once the inputs files has been edited, run the execcutable as usual
-
-.. highlight:: shell
-
-::
-
-
-    mpiexec -np 4 ./main2d.gnu.MPI.ex inputs
-
diff --git a/Docs/sphinx_tutorials/source/SUNDIALS_Tutorial.rst b/Docs/sphinx_tutorials/source/SUNDIALS_Tutorial.rst
new file mode 100644
index 00000000000..f97e376801a
--- /dev/null
+++ b/Docs/sphinx_tutorials/source/SUNDIALS_Tutorial.rst
@@ -0,0 +1,21 @@
+.. role:: cpp(code)
+   :language: c++
+
+.. role:: fortran(code)
+   :language: fortran
+
+Tutorials/SUNDIALS
+==========================
+
+AMReX provides five tutorials in the ``amrex/Tutorials/SUNDIALS`` directory.
+There are three versions of ``EX1`` which parallelize differently. ``EX1_C``
+packs a box's worth of equations into a serial NVector, uses CVODE to solve, and then unpacks
+the solution back into the box it came from. ``EX1_CUDA`` uses the CUDA NVector implementation
+instead. ``EX1_F`` parallelizes over the cells individually. ``EX2_F`` is based on
+the ``fcvRoberts_dns.f`` example code in CVODE. ``EX-CUSOLVER`` uses a Castro-style driver and
+tests different ODE solver configurations.
+
+See the SUNDIALS_ section of the AMReX documentation for general instructions
+on how to include SUNDIALS in an AMReX application.
+
+.. _SUNDIALS: https://amrex-codes.github.io/amrex/docs_html/SUNDIALS.html
diff --git a/Docs/sphinx_tutorials/source/index.rst b/Docs/sphinx_tutorials/source/index.rst
index a9acb82c044..7368b45b5ef 100644
--- a/Docs/sphinx_tutorials/source/index.rst
+++ b/Docs/sphinx_tutorials/source/index.rst
@@ -35,7 +35,6 @@ The amrex/Tutorials directory is broken into the following categories:
    MUI_Tutorial
    Particles_Tutorial
    SDC_Tutorial
-   SENSEI_Tutorial
    SWFFT_Tutorial

 Indices and tables
diff --git a/Src/Amr/AMReX_Amr.H b/Src/Amr/AMReX_Amr.H
index 6a7432c3ec7..90e54a53fd3 100644
--- a/Src/Amr/AMReX_Amr.H
+++ b/Src/Amr/AMReX_Amr.H
@@ -15,19 +15,11 @@
 #include

-#ifdef USE_PERILLA
-#include
-#include
-#endif
-
 namespace amrex {

 class AmrLevel;
 class LevelBld;
 class BoxDomain;
-template
-class MFGraph;
-class AmrTask;

 #if defined(BL_USE_SENSEI_INSITU)
 class AmrInSituBridge;
 #endif
@@ -43,9 +35,6 @@ class AmrInSituBridge;
 class Amr
     : public AmrCore
 {
-    template
-    friend class MFGraph;
-    friend class AmrTask;
     typedef std::multimap< std::pair, double > BoundaryPointList;

 public:
@@ -189,6 +178,8 @@ public:
     static void fillDerivePlotVarList ();
     static void fillDeriveSmallPlotVarList ();

+    static void setComputeNewDtOnRegrid (int flag) { compute_new_dt_on_regrid = flag; }
+
     static void Initialize ();
     static void Finalize ();

     //! AmrLevel lev.
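For reference, the new static setter in the hunk above gives applications
programmatic control over whether a new dt is computed after a regrid. A
minimal, hypothetical usage sketch (not part of this patch):

.. code-block:: cpp

   // In application setup code, before entering the time loop:
   amrex::Amr::setComputeNewDtOnRegrid(1); // recompute dt whenever regrid() runs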
@@ -274,7 +265,7 @@ public: intersect_hix = IntersectHiX; intersect_loy = IntersectLoY; intersect_hiy = IntersectHiY; - }; + } /** * \brief More general version: @@ -296,32 +287,32 @@ public: intersect_hiy = IntersectHiY; intersect_loz = IntersectLoZ; intersect_hiz = IntersectHiZ; - }; + } BoundaryPointList& getIntersectLoX() noexcept { return intersect_lox; - }; + } BoundaryPointList& getIntersectHiX() noexcept { return intersect_hix; - }; + } BoundaryPointList& getIntersectLoY() noexcept { return intersect_loy; - }; + } BoundaryPointList& getIntersectHiY() noexcept { return intersect_hiy; - }; + } BoundaryPointList& getIntersectLoZ() noexcept { return intersect_loz; - }; + } BoundaryPointList& getIntersectHiZ() noexcept { return intersect_hiz; - }; + } #ifdef AMREX_PARTICLES //! Redistribute particles @@ -374,14 +365,14 @@ protected: Real stop_time); // pure virtural function in AmrCore - virtual void MakeNewLevelFromScratch (int lev, Real time, const BoxArray& ba, const DistributionMapping& dm) override - { amrex::Abort("How did we get her!"); } - virtual void MakeNewLevelFromCoarse (int lev, Real time, const BoxArray& ba, const DistributionMapping& dm) override - { amrex::Abort("How did we get her!"); } - virtual void RemakeLevel (int lev, Real time, const BoxArray& ba, const DistributionMapping& dm) override - { amrex::Abort("How did we get her!"); } - virtual void ClearLevel (int lev) override - { amrex::Abort("How did we get her!"); } + virtual void MakeNewLevelFromScratch (int /*lev*/, Real /*time*/, const BoxArray& /*ba*/, const DistributionMapping& /*dm*/) override + { amrex::Abort("How did we get here!"); } + virtual void MakeNewLevelFromCoarse (int /*lev*/, Real /*time*/, const BoxArray& /*ba*/, const DistributionMapping& /*dm*/) override + { amrex::Abort("How did we get here!"); } + virtual void RemakeLevel (int /*lev*/, Real /*time*/, const BoxArray& /*ba*/, const DistributionMapping& /*dm*/) override + { amrex::Abort("How did we get here!"); } + virtual void ClearLevel (int /*lev*/) override + { amrex::Abort("How did we get here!"); } //! Whether to write a plotfile now bool writePlotNow () noexcept; @@ -475,18 +466,13 @@ protected: static Vector initial_ba; //! 
Array of BoxArrays read in to externally define grid hierarchy at each regrid static Vector regrid_ba; + static int compute_new_dt_on_regrid; #if defined(BL_USE_SENSEI_INSITU) static AmrInSituBridge *insitu_bridge; #endif public: -#ifdef USE_PERILLA - std::vector > graphArray; - std::vector amrGraphArray; - std::vector &get_graphArray(int level){return graphArray[level];} -#endif - BoundaryPointList intersect_lox; BoundaryPointList intersect_loy; BoundaryPointList intersect_loz; diff --git a/Src/Amr/AMReX_Amr.cpp b/Src/Amr/AMReX_Amr.cpp index bf6f20eda89..db8e7942511 100644 --- a/Src/Amr/AMReX_Amr.cpp +++ b/Src/Amr/AMReX_Amr.cpp @@ -12,10 +12,6 @@ #include #endif -#include -#include -#include - #include #include #include @@ -48,29 +44,6 @@ #include #endif -#ifdef USE_PERILLA -#include -#include -#ifdef USE_PERILLA -//#ifndef USE_PERILLA_ON_DEMAND - pthread_mutex_t teamFinishLock=PTHREAD_MUTEX_INITIALIZER; -//#endif -#ifdef PERILLA_USE_UPCXX -extern struct rMsgMap_t{ - std::map< int, std::map< int, std::list< Package* > > > map; - volatile int size=0; - pthread_mutex_t lock= PTHREAD_MUTEX_INITIALIZER; -}rMsgMap; -extern struct sMsgMap_t{ - std::map< int, std::map< int, std::list< Package* > > > map; - volatile int size=0; - pthread_mutex_t lock= PTHREAD_MUTEX_INITIALIZER; -}sMsgMap; - -#endif -#endif -#endif - #ifdef BL_USE_SENSEI_INSITU #include #endif @@ -88,6 +61,7 @@ bool Amr::first_plotfile; bool Amr::first_smallplotfile; Vector Amr::initial_ba; Vector Amr::regrid_ba; +int Amr::compute_new_dt_on_regrid; #ifdef BL_USE_SENSEI_INSITU AmrInSituBridge* Amr::insitu_bridge; #endif @@ -97,11 +71,7 @@ namespace const std::string CheckPointVersion("CheckPointVersion_1.0"); bool initialized = false; -} -//Tan Nov 24, 2017 : I removed this anonymous namespace so I could access the inner variables from other source files -//namespace -//{ // // These are all ParmParse'd in. Set defaults in Initialize()!!! // @@ -116,12 +86,11 @@ namespace int insitu_on_restart; int checkpoint_on_restart; bool checkpoint_files_output; - int compute_new_dt_on_regrid; bool precreateDirectories; bool prereadFAHeaders; VisMF::Header::Version plot_headerversion(VisMF::Header::Version_v1); VisMF::Header::Version checkpoint_headerversion(VisMF::Header::Version_v1); -//} +} @@ -1277,7 +1246,7 @@ Amr::initialInit (Real strt_time, void Amr::InitializeInit(Real strt_time, - Real stop_time, + Real /*stop_time*/, const BoxArray* lev0_grids, const Vector* pmap) { @@ -1402,7 +1371,10 @@ Amr::restart (const std::string& filename) // int linit = false; - readProbinFile(linit); + if (!probin_file.empty()) { + readProbinFile(linit); + } + // // Start calculation from given restart file. 
// @@ -1906,11 +1878,6 @@ Amr::timeStep (int level, int niter, Real stop_time) { -#if defined(USE_PERILLA_PTHREADS) || defined(USE_PERILLA_OMP) - perilla::syncAllWorkerThreads(); - if(perilla::isMasterThread()) - { -#endif BL_PROFILE("Amr::timeStep()"); BL_COMM_PROFILE_NAMETAG("Amr::timeStep TOP"); @@ -1932,38 +1899,12 @@ Amr::timeStep (int level, else { int lev_top = std::min(finest_level, max_level-1); - -#ifdef USE_PERILLA - int cnt=0; - bool *metadataChanged=new bool[finest_level+1]; - for (int l=0; l <= finest_level; l++) - metadataChanged[l]=false; -#endif - for (int i(level); i <= lev_top; ++i) { const int old_finest = finest_level; if (okToRegrid(i)) { -#ifdef USE_PERILLA -#if defined(USE_PERILLA_PTHREADS) || defined(USE_PERILLA_OMP) - //ask the communication thread to stop so that I can update the metadata - Perilla::updateMetadata_request=1; - while(!Perilla::updateMetadata_noticed){ - - } -#endif - //for (int k(i>0?i-1:0); k <= finest_level; ++k) { - for (int k=0; k <= finest_level; ++k) { - if(metadataChanged[k]==false){ - graphArray[k].clear(); - getLevel(k).finalizePerilla(time); - metadataChanged[k]=true; - cnt++; - } - } -#endif regrid(i,time); // @@ -2002,22 +1943,6 @@ Amr::timeStep (int level, lev_top = std::min(finest_level, max_level - 1); } } -#ifdef USE_PERILLA - if(cnt){ - if(ParallelDescriptor::NProcs()>1){ - Perilla::clearTagMap(); - Perilla::clearMyTagMap(); - Perilla::genTags=true; - Perilla::uTags=0; - Perilla::pTagCnt.clear(); - } - for(int i=0; i<= finest_level; i++){ - getLevel(i).initPerilla(cumtime); - } - Perilla::updateMetadata_done++; - } - delete [] metadataChanged; -#endif if (max_level == 0 && loadbalance_level0_int > 0 && loadbalance_with_workestimates) { @@ -2045,21 +1970,9 @@ Amr::timeStep (int level, << "ADVANCE with dt = " << dt_level[level] << "\n"; } -#if defined(USE_PERILLA_PTHREADS) || defined(USE_PERILLA_OMP) - } - perilla::syncAllWorkerThreads(); -#endif - - BL_PROFILE_REGION_START("amr_level.advance"); Real dt_new = amr_level[level]->advance(time,dt_level[level],iteration,niter); BL_PROFILE_REGION_STOP("amr_level.advance"); -#if defined(USE_PERILLA_PTHREADS) || defined(USE_PERILLA_OMP) - perilla::syncAllWorkerThreads(); - if(perilla::isMasterThread()) - { -#endif - dt_min[level] = iteration == 1 ? dt_new : std::min(dt_min[level],dt_new); level_steps[level]++; @@ -2089,17 +2002,8 @@ Amr::timeStep (int level, dt_level[k] = dt_level[k-1] / n_cycle[k]; } } -#ifdef USE_PERILLA -// getLevel(level).finalizePerilla(cumtime); -// getLevel(level).initPerilla(cumtime); -#endif } -#if defined(USE_PERILLA_PTHREADS) || defined(USE_PERILLA_OMP) - } - perilla::syncAllWorkerThreads(); -#endif - // // Advance grids at higher level. 
// @@ -2122,23 +2026,10 @@ Amr::timeStep (int level, } } -#if defined(USE_PERILLA_PTHREADS) || defined(USE_PERILLA_OMP) - perilla::syncAllWorkerThreads(); -#endif - amr_level[level]->post_timestep(iteration); -#if defined(USE_PERILLA_PTHREADS) || defined(USE_PERILLA_OMP) - perilla::syncAllWorkerThreads(); - if(perilla::isMasterThread()) - { -#endif // Set this back to negative so we know whether we are in fact in this routine which_level_being_advanced = -1; -#if defined(USE_PERILLA_PTHREADS) || defined(USE_PERILLA_OMP) - } - perilla::syncAllWorkerThreads(); -#endif } Real @@ -2153,13 +2044,6 @@ Amr::coarseTimeStep (Real stop_time) { Real run_stop; Real run_strt; -#ifdef USE_PERILLA_PTHREADS - //mpi+pthreads (default) or upcxx+pthreads - std::vector flattenedGraphArray; - perilla::syncAllThreads(); - if(perilla::isMasterThread()) - { -#endif BL_PROFILE_REGION_START("Amr::coarseTimeStep()"); BL_PROFILE("Amr::coarseTimeStep()"); std::stringstream stepName; @@ -2193,189 +2077,7 @@ Amr::coarseTimeStep (Real stop_time) } BL_PROFILE_REGION_START(stepName.str()); - -#ifdef USE_PERILLA -#ifdef USE_PERILLA_PTHREADS - //mpi+pthreads (default) or upcxx+pthreads - } - perilla::syncAllThreads(); - - if(perilla::isMasterThread()){ - Perilla::updateMetadata_request = 0; - Perilla::updateMetadata_noticed = 0; - Perilla::updateMetadata_done = 0; - Perilla::numTeamsFinished = 0; - RegionGraph::graphCnt = 0; - if(levelSteps(0)==0){ - graphArray.resize(finest_level+1); - for(int i=0; i<= finest_level; i++) - getLevel(i).initPerilla(cumtime); - if(ParallelDescriptor::NProcs()>1){ - Perilla::syncProcesses(); - Perilla::communicateTags(); - Perilla::syncProcesses(); - } - } - } - perilla::syncAllThreads(); - - if(perilla::isCommunicationThread()) - { - Perilla::flattenGraphHierarchy(graphArray, flattenedGraphArray); - bool doublechecked=false; - while(true){ - if(!Perilla::updateMetadata_request){ - Perilla::serviceMultipleGraphCommDynamic(flattenedGraphArray,true,perilla::tid()); - if( Perilla::numTeamsFinished == perilla::NUM_THREAD_TEAMS) - { - Perilla::syncProcesses(); - flattenedGraphArray.clear(); - Perilla::syncProcesses(); - break; - } - }else{ - Perilla::syncProcesses(); - for(int g=0; ggraphTeardown(); - } -#ifdef PERILLA_USE_UPCXX - pthread_mutex_lock(&(rMsgMap.lock)); - for(int i=0; i0){ - rMsgMap.map[i][j].pop_front(); - rMsgMap.size--; - } - } - } - pthread_mutex_unlock(&(rMsgMap.lock)); - while(sMsgMap.size>0){ - } -#endif - Perilla::syncProcesses(); - Perilla::updateMetadata_noticed=1; - while(Perilla::updateMetadata_done==0){//!= (max_level+1)){ - - } - Perilla::updateMetadata_request=0; - Perilla::updateMetadata_noticed=0; - Perilla::updateMetadata_done=0; - if(ParallelDescriptor::NProcs()>1){ - Perilla::syncProcesses(); - Perilla::communicateTags(); - Perilla::syncProcesses(); - } - flattenedGraphArray.clear(); - Perilla::flattenGraphHierarchy(graphArray, flattenedGraphArray); - Perilla::serviceMultipleGraphCommDynamic(flattenedGraphArray,true,perilla::tid()); - - if( Perilla::numTeamsFinished == perilla::NUM_THREAD_TEAMS) - { - Perilla::syncProcesses(); - flattenedGraphArray.clear(); - Perilla::syncProcesses(); - break; - } - } - } - }else{ - timeStep(0,cumtime,1,1,stop_time); - if(perilla::isMasterWorkerThread()){ - pthread_mutex_lock(&teamFinishLock); - Perilla::numTeamsFinished++; - pthread_mutex_unlock(&teamFinishLock); - } - } - - perilla::syncAllThreads(); - if(perilla::isMasterThread()){ - if(!okToContinue() || (level_steps[0] == Perilla::max_step) || (stop_time -(dt_level[0] + 
cumTime())<=0)){ - for(int i=0; i<= finest_level; i++){ - getLevel(i).finalizePerilla(cumtime); - } - } - } -#else - Perilla::numTeamsFinished = 0; - RegionGraph::graphCnt = 0; - if(levelSteps(0)==0){ - graphArray.resize(finest_level+1); - for(int i=0; i<= finest_level; i++) - getLevel(i).initPerilla(cumtime); - if(ParallelDescriptor::NProcs()>1){ - Perilla::communicateTags(); - } - } - Perilla::syncProcesses(); - -#ifdef USE_PERILLA_OMP -// int nThreads= perilla::NUM_THREAD_TEAMS * perilla::NUM_THREADS_PER_TEAM; -// num_threads(nThreads) -#pragma omp parallel default(shared) - { - if(perilla::isCommunicationThread()) - { - std::vector flattenedGraphArray; - while(true){ - Perilla::flattenGraphHierarchy(graphArray, flattenedGraphArray); - Perilla::serviceMultipleGraphCommDynamic(flattenedGraphArray,true,perilla::tid()); - if( Perilla::numTeamsFinished == perilla::NUM_THREAD_TEAMS) - { - //perilla::syncWorkers(); - //if(perilla::wid()==0){ - //Perilla::syncProcesses(); - /*for(int g=0; ggraphTeardown(); - }*/ - //} - flattenedGraphArray.clear(); - //perilla::syncWorkers(); - if(perilla::wid()==0) Perilla::syncProcesses(); - break; - } - } - } - else{ - timeStep(0,cumtime,1,1,stop_time); - if(perilla::isMasterWorkerThread()){ - #pragma omp atomic - Perilla::numTeamsFinished++; - } - } - } -#elif defined(USE_PERILLA_ON_DEMAND) - //RTS on-demand - timeStep(0,cumtime,1,1,stop_time); -#else - cout<<"Undefined Async Mode"<* pmap) { + amrex::ignore_unused(pmap); + BL_PROFILE("Amr::defBaseLevel()"); // Just initialize this here for the heck of it which_level_being_advanced = -1; @@ -2847,9 +2545,12 @@ Amr::regrid (int lbase, // // Reclaim old-time grid space for all remain levels > lbase. + // But skip this if we're in the middle of a post-timestep regrid. // for(int lev = start; lev <= finest_level; ++lev) { - amr_level[lev]->removeOldData(); + if (!amr_level[lev]->postStepRegrid()) { + amr_level[lev]->removeOldData(); + } } // // Reclaim all remaining storage for levels > new_finest. @@ -3107,7 +2808,7 @@ Amr::printGridInfo (std::ostream& os, int numgrid = bs.size(); Long ncells = amr_level[lev]->countCells(); double ntot = Geom(lev).Domain().d_numPts(); - Real frac = 100.0_rt*(Real(ncells) / ntot); + Real frac = Real(100.0)*(Real(ncells) / ntot); const DistributionMapping& map = amr_level[lev]->get_new_data(0).DistributionMap(); os << " Level " diff --git a/Src/Amr/AMReX_AmrLevel.H b/Src/Amr/AMReX_AmrLevel.H index c2b6741068b..16f142b1daa 100644 --- a/Src/Amr/AMReX_AmrLevel.H +++ b/Src/Amr/AMReX_AmrLevel.H @@ -27,9 +27,6 @@ namespace amrex { class TagBox; class TagBoxArray; -template -class MFGraph; -class RGIter; /** * \brief Virtual base class for managing individual levels. @@ -42,9 +39,6 @@ class AmrLevel friend class Amr; friend class FillPatchIterator; friend class FillPatchIteratorHelper; - template friend class MFGraph; - friend class RGIter; - friend class AsyncFillPatchIterator; public: //! What time are we at? @@ -102,9 +96,9 @@ public: * Unlike writePlotFile, this is NOT a pure virtual function * so implementation by derived classes is optional. */ - virtual void writeSmallPlotFile (const std::string& dir, - std::ostream& os, - VisMF::How how = VisMF::NFiles) {}; + virtual void writeSmallPlotFile (const std::string& /*dir*/, + std::ostream& /*os*/, + VisMF::How /*how*/ = VisMF::NFiles) {} //! Write current state to checkpoint file. 
virtual void checkPoint (const std::string& dir, std::ostream& os, @@ -162,13 +156,6 @@ public: int iteration, int ncycle) = 0; -#ifdef USE_PERILLA - // For Perilla initialization - virtual void initPerilla (Real time)=0; - virtual void finalizePerilla (Real time)=0; -#endif - - /** * \brief Contains operations to be done after a timestep. This is a * pure virtual function and hence MUST be implemented by derived @@ -183,7 +170,7 @@ public: /** * \brief Operations to be done after restart. */ - virtual void post_restart () {}; + virtual void post_restart () {} /** * \brief Operations to be done after regridding * This is a pure virtual function and hence MUST be @@ -380,7 +367,7 @@ public: #ifdef AMREX_PARTICLES //! This function can be called from the parent - virtual void particle_redistribute (int lbase = 0, bool a_init = false) {;} + virtual void particle_redistribute (int /*lbase*/ = 0, bool /*a_init*/ = false) {;} #endif static void FillPatch (AmrLevel& amrlevel, @@ -498,111 +485,7 @@ class FillPatchIterator MultiFab& get_mf() noexcept { return m_fabs; } -#ifdef USE_PERILLA - FillPatchIterator (AmrLevel& amrlevel, - MultiFab& leveldata, - int boxGrow, - Real time, - int state_indx, - int scomp, - int ncomp, - int f); - - void initFillPatch(int boxGrow, int time, int index, int scomp, int ncomp, int iter); - - void InitializePush (int boxGrow, - Real time, - int state_indx, - int scomp, - int ncomp, - int f); - - void InitializePull (int boxGrow, - Real time, - int state_indx, - int scomp, - int ncomp, - int f); - - void FillPatchPush (int boxGrow, - Real time, - int state_indx, - int scomp, - int ncomp, - int f, - unsigned char pushLevel, - bool singleT=false); - - void FillPatchPull (int boxGrow, - Real time, - int state_indx, - int scomp, - int ncomp, - int f, - bool singleT=false); - - void finalizeGraphs() - { - //std::cout << "Completing RGs "; - - if(destGraph != NULL) - { - //std::cout << destGraph->graphID << " "; - destGraph->finalizeGraph(); - } - if(csrcGraph != NULL) - { - //std::cout << csrcGraph->graphID << " "; - csrcGraph->finalizeGraph(); - } - if(fsrcGraph != NULL) - { - //std::cout << fsrcGraph->graphID << " "; - fsrcGraph->finalizeGraph(); - } - if(m_rg_crse_patch != NULL) - { - //std::cout << m_rg_crse_patch->graphID << " "; - m_rg_crse_patch->finalizeGraph(); - } - - //std::cout <<" by tg " << tg << std::endl; - } - - void Reset() - { - int tg= perilla::wid(); - //std::cout << "Resetting RGs "; - if(destGraph != NULL) - { - //std::cout << destGraph->graphID << " "; - destGraph->Reset(); - } - if(csrcGraph != NULL) - { - //std::cout << csrcGraph->graphID << " "; - csrcGraph->Reset(); - } - if(fsrcGraph != NULL) - { - //std::cout << fsrcGraph->graphID << " "; - fsrcGraph->Reset(); - } - if(m_rg_crse_patch != NULL) - { - //std::cout << m_rg_crse_patch->graphID << " "; - m_rg_crse_patch->Reset(); - } - //std::cout <<" by tg " << tg << std::endl; - } - - RegionGraph* get_destGraph(){return destGraph;} - RegionGraph* get_crscGraph(){return csrcGraph;} - RegionGraph* get_fsrcGraph(){return fsrcGraph;} -#endif - - - private: +private: // // Disallowed. 
// @@ -621,80 +504,6 @@ class FillPatchIterator std::vector< std::pair > m_range; MultiFab m_fabs; int m_ncomp; - -public: -#ifdef USE_PERILLA - RegionGraph* destGraph; - RegionGraph* csrcGraph; - RegionGraph* fsrcGraph; - RegionGraph* m_rg_crse_patch; - std::list regionList; - std::list mfList; - std::list stateDataList; - - - - MultiFab* m_mf_crse_patch; - const FabArrayBase::FPinfo* m_fpc; - MultiFab* dmf; - MultiFab* dmff; - Vector smf; - Geometry* geom; - StateDataPhysBCFunct* physbcf; - bool isProperlyNested; - Vector smf_crse; - Vector stime_crse; - StateDataPhysBCFunct* physbcf_crse; - Geometry* geom_crse; - Vector smf_fine; - Vector stime_fine; - StateDataPhysBCFunct* physbcf_fine; - Geometry* geom_fine; - - Vector stime; - void FillFromLevel0Push (Real time, int index, int scomp, int dcomp, int ncomp, int f); - void FillFromLevel0PushOnly (Real time, int index, int scomp, int dcomp, int ncomp, int f, bool singleT); - void FillFromLevel0Pull (Real time, int index, int scomp, int dcomp, int ncomp, int f, bool singleT); - void FillFromTwoLevelsPushOnly (Real time, int index, int scomp, int dcomp, int ncomp, int f, unsigned char pushLevel, bool singleT); - void FillFromTwoLevelsPush (Real time, int index, int scomp, int dcomp, int ncomp, int f, unsigned char pushLevel, bool singleT); - void FillFromTwoLevelsPull (Real time, int index, int scomp, int dcomp, int ncomp, int f, bool singleT); - void FillPatchTwoLevelsPush (Amr& amr, MultiFab& mf, Real time, - Vector& cmf, Vector& ct, - Vector& fmf, Vector& ft, - RegionGraph* destGraph, RegionGraph* csrcGraph, RegionGraph* fsrcGraph, int f, - FillPatchIterator* fpIter, - MultiFab *dmf, - MultiFab *dmff, - int scomp, int dcomp, int ncomp, - const Geometry& cgeom, const Geometry& fgeom, - StateDataPhysBCFunct& cbc, StateDataPhysBCFunct& fbc, - const IntVect& ratio, - Interpolater* mapper, const Vector& bcs, unsigned char pushLevel, bool singleT); - - void FillPatchTwoLevelsPull (MultiFab& mf, Real time, - Vector& cmf, Vector& ct, - Vector& fmf, Vector& ft, - RegionGraph* destGraph, RegionGraph* csrcGraph, RegionGraph* fsrcGraph, int f, - FillPatchIterator* fpIter, - int scomp, int dcomp, int ncomp, - const Geometry& cgeom, const Geometry& fgeom, - StateDataPhysBCFunct& cbc, StateDataPhysBCFunct& fbc, - const IntVect& ratio, - Interpolater* mapper, const Vector& bcs, bool singleT); - - void FillPatchSingleLevelPush (Amr& amr, MultiFab& mf, Real time, - Vector& smf, Vector& stime, - RegionGraph* destGraph, RegionGraph* srcGraph, int f, - MultiFab *dmf, - int scomp, int dcomp, int ncomp, - const Geometry& geom, StateDataPhysBCFunct& physbcf, bool singleT); - void FillPatchSingleLevelPull (MultiFab& mf, Real time, - Vector& smf, Vector& stime, - RegionGraph* destGraph, RegionGraph* srcGraph, int f, - int scomp, int dcomp, int ncomp, - const Geometry& geom, StateDataPhysBCFunct& physbcf, bool singleT); - -#endif }; class FillPatchIteratorHelper @@ -754,329 +563,6 @@ private: std::map< int,Vector< Vector< Vector > > > m_fbid; // [grid][level][fillablesubbox][oldnew] }; - - //////////////////////////////////////Perilla///////////////////// -#ifdef USE_PERILLA -class AsyncFillPatchIterator - : - public MFIter -{ - public: - - friend class AmrLevel; - friend class RGIter; - - AsyncFillPatchIterator (AmrLevel& amrlevel, - MultiFab& leveldata, - int boxGrow, - Real time, - int state_indx, - int scomp, - int ncomp, - int iter); - - void initFillPatch(int boxGrow, - Real time, - int index, - int scomp, - int ncomp, - int iter); - - static void 
initialSend(amrex::Vector afpi, - amrex::Vector upper_afpi, - int boxGrow, - Real time, - int state_indx, - int scomp, - int ncomp, - int iter); - - void PushOnly (int boxGrow, - Real time, - int state_indx, - int scomp, - int ncomp, - int f, - unsigned char pushLevel, - bool singleT=false); - - void SendIntraLevel (RGIter& rgi, - int boxGrow, - Real time, - int state_indx, - int scomp, - int ncomp, - int iter, - int f, - bool singleT=false); - - void SendIntraLevel (RGIter* rgi, - int boxGrow, - Real time, - int state_indx, - int scomp, - int ncomp, - int iter, - int f, - bool singleT=false); - - void SendInterLevel (RGIter& rgi, - int boxGrow, - Real time, - int state_indx, - int scomp, - int ncomp, - int iter, - int f, - bool singleT=false); - - void SendInterLevel (RGIter* rgi, - int boxGrow, - Real time, - int state_indx, - int scomp, - int ncomp, - int iter, - int f, - bool singleT=false); - - void Receive (RGIter& rgi, - int boxGrow, - Real time, - int state_indx, - int scomp, - int ncomp, - int f, - bool singleT=false); - - void Receive (RGIter* rgi, - int boxGrow, - Real time, - int state_indx, - int scomp, - int ncomp, - int f, - bool singleT=false); - - void Receive (RGIter& rgi, - MultiFab& dest, - int boxGrow, - Real time, - int state_indx, - int scomp, - int ncomp, - int f, - bool singleT=false); - - void Receive (RGIter* rgi, - MultiFab& dest, - int boxGrow, - const Real time, - int state_indx, - int scomp, - int ncomp, - int f, - bool singleT=false); - - void PullOnly (int boxGrow, - Real time, - int state_indx, - int scomp, - int ncomp, - int f, - bool singleT=false); - - void PullOnly (MultiFab& dest, - int boxGrow, - Real time, - int state_indx, - int scomp, - int ncomp, - int f, - bool singleT=false); - - void FillPatchTwoLevelsPush (Amr& amr, MultiFab& mf, Real time, - Vector& cmf, Vector& ct, - Vector& fmf, Vector& ft, - RegionGraph* destGraph, RegionGraph* csrcGraph, RegionGraph* fsrcGraph, int f, - AsyncFillPatchIterator* fpIter, - MultiFab *dmf, - MultiFab *dmff, - int scomp, int dcomp, int ncomp, - const Geometry& cgeom, const Geometry& fgeom, - StateDataPhysBCFunct& cbc, StateDataPhysBCFunct& fbc, - const IntVect& ratio, - Interpolater* mapper, const Vector& bcs, unsigned char pushLevel, bool singleT); - - void FillPatchTwoLevelsPull (MultiFab& mf, Real time, - Vector& cmf, Vector& ct, - Vector& fmf, Vector& ft, - RegionGraph* destGraph, RegionGraph* csrcGraph, RegionGraph* fsrcGraph, int f, - AsyncFillPatchIterator* fpIter, - int scomp, int dcomp, int ncomp, - const Geometry& cgeom, const Geometry& fgeom, - StateDataPhysBCFunct& cbc, StateDataPhysBCFunct& fbc, - const IntVect& ratio, - Interpolater* mapper, const Vector& bcs, bool singleT); - - void FillPatchSingleLevelPush (Amr& amr, MultiFab& mf, Real time, - Vector& smf, const Vector& stime, - RegionGraph* destGraph, RegionGraph* srcGraph, int f, - MultiFab *dmf, - int scomp, int dcomp, int ncomp, - const Geometry& geom, StateDataPhysBCFunct& physbcf, bool singleT); - void FillPatchSingleLevelPull (MultiFab& mf, Real time, - Vector& smf, const Vector& stime, - RegionGraph* destGraph, RegionGraph* srcGraph, int f, - int scomp, int dcomp, int ncomp, - const Geometry& geom, StateDataPhysBCFunct& physbcf, bool singleT); - - void FillFromTwoLevelsPush (Real time, - int index, - int scomp, - int dcomp, - int ncomp, - int f, - unsigned char pushLevel, - bool singleT); - void FillFromTwoLevelsPull (Real time, - int index, - int scomp, - int dcomp, - int ncomp, - int f, - bool singleT); - - void FillFromTwoLevelsPull 
(MultiFab& dest, - Real time, - int index, - int scomp, - int dcomp, - int ncomp, - int f, - bool singleT); - - ~AsyncFillPatchIterator (); - - FArrayBox& operator() () { return m_fabs[MFIter::index()]; } - - Box UngrownBox () const { return MFIter::validbox(); } - - MultiFab& get_mf() { return m_fabs; } - - // protected: - // - // Disallowed. - // - AsyncFillPatchIterator (); - AsyncFillPatchIterator (const AsyncFillPatchIterator& rhs); - AsyncFillPatchIterator& operator= (const AsyncFillPatchIterator& rhs); - - // - // The data. - // - AmrLevel& m_amrlevel; - MultiFab& m_leveldata; - std::vector< std::pair > m_range; - MultiFab m_fabs; - int m_ncomp; - -public: - bool isProperlyNested; - - amrex::Vector smf; - amrex::Vector stime; - StateDataPhysBCFunct* physbcf; - Geometry* geom; - - - amrex::Vector smf_crse; - amrex::Vector stime_crse; - StateDataPhysBCFunct* physbcf_crse; - Geometry* geom_crse; - - amrex::Vector smf_fine; - amrex::Vector stime_fine; - StateDataPhysBCFunct* physbcf_fine; - Geometry* geom_fine; - - - RegionGraph* destGraph; - RegionGraph* csrcGraph; - RegionGraph* fsrcGraph; - - MultiFab* m_mf_crse_patch; - RegionGraph* m_rg_crse_patch; - const FabArrayBase::FPinfo* m_fpc; - - //PArray raii; - MultiFab* dmf; - MultiFab* dmff; - std::list regionList; - std::list mfList; - std::list stateDataList; - - - - void completeRegionGraphs() - { - //std::cout << "Completing RGs "; - - if(destGraph != NULL) - { - //std::cout << destGraph->graphID << " "; - destGraph->finalizeRegionGraph(); - } - if(csrcGraph != NULL) - { - //std::cout << csrcGraph->graphID << " "; - csrcGraph->finalizeRegionGraph(); - } - if(fsrcGraph != NULL) - { - //std::cout << fsrcGraph->graphID << " "; - fsrcGraph->finalizeRegionGraph(); - } - if(m_rg_crse_patch != NULL) - { - //std::cout << m_rg_crse_patch->graphID << " "; - m_rg_crse_patch->finalizeRegionGraph(); - } - //std::cout <<" by tg " << tg << std::endl; - } - - void Reset() - { - //std::cout << "Resetting RGs "; - if(destGraph != NULL) - { - //std::cout << destGraph->graphID << " "; - destGraph->Reset(); - } - if(csrcGraph != NULL) - { - //std::cout << csrcGraph->graphID << " "; - csrcGraph->Reset(); - } - if(fsrcGraph != NULL) - { - //std::cout << fsrcGraph->graphID << " "; - fsrcGraph->Reset(); - } - if(m_rg_crse_patch != NULL) - { - //std::cout << m_rg_crse_patch->graphID << " "; - m_rg_crse_patch->Reset(); - } - //std::cout <<" by tg " << tg << std::endl; - } - - // Variables for optimization calls of two level push/pulll - -}; -#endif - - } #endif /*_AmrLevel_H_*/ diff --git a/Src/Amr/AMReX_AmrLevel.cpp b/Src/Amr/AMReX_AmrLevel.cpp index 20c43e7b27a..40c30dedd07 100644 --- a/Src/Amr/AMReX_AmrLevel.cpp +++ b/Src/Amr/AMReX_AmrLevel.cpp @@ -1,7 +1,6 @@ #include -#include #include #include @@ -21,14 +20,7 @@ #include #endif -#ifdef USE_PERILLA -#include -#endif - namespace amrex { -#ifdef USE_PERILLA -using namespace perilla; -#endif #ifdef AMREX_USE_EB int AmrLevel::m_eb_basic_grow_cells = 5; @@ -54,12 +46,12 @@ AmrLevel::postCoarseTimeStep (Real time) } void -AmrLevel::set_preferred_boundary_values (MultiFab& S, - int state_index, - int scomp, - int dcomp, - int ncomp, - Real time) const +AmrLevel::set_preferred_boundary_values (MultiFab& /*S*/, + int /*state_index*/, + int /*scomp*/, + int /*dcomp*/, + int /*ncomp*/, + Real /*time*/) const {} DeriveList& @@ -69,8 +61,8 @@ AmrLevel::get_derive_lst () noexcept } void -AmrLevel::manual_tags_placement (TagBoxArray& tags, - const Vector& bf_lev) +AmrLevel::manual_tags_placement (TagBoxArray& 
/*tags*/, + const Vector& /*bf_lev*/) {} AmrLevel::AmrLevel () noexcept @@ -113,14 +105,17 @@ AmrLevel::AmrLevel (Amr& papa, state.resize(desc_lst.size()); #ifdef AMREX_USE_EB - m_factory = makeEBFabFactory(geom, ba, dm, - {m_eb_basic_grow_cells, - m_eb_volume_grow_cells, - m_eb_full_grow_cells}, - m_eb_support_level); -#else - m_factory.reset(new FArrayBoxFactory()); + if (EB2::TopIndexSpaceIfPresent()) { + m_factory = makeEBFabFactory(geom, ba, dm, + {m_eb_basic_grow_cells, + m_eb_volume_grow_cells, + m_eb_full_grow_cells}, + m_eb_support_level); + } else #endif + { + m_factory.reset(new FArrayBoxFactory()); + } // Note that this creates a distribution map associated with grids. for (int i = 0; i < state.size(); i++) @@ -184,7 +179,9 @@ AmrLevel::writePlotFile (const std::string& dir, int n_data_items = plot_var_map.size() + derive_names.size(); #ifdef AMREX_USE_EB - n_data_items += 1; + if (EB2::TopIndexSpaceIfPresent()) { + n_data_items += 1; + } #endif // get the time from the first State_Type @@ -219,7 +216,9 @@ AmrLevel::writePlotFile (const std::string& dir, } #ifdef AMREX_USE_EB - os << "vfrac\n"; + if (EB2::TopIndexSpaceIfPresent()) { + os << "vfrac\n"; + } #endif os << AMREX_SPACEDIM << '\n'; @@ -304,10 +303,12 @@ AmrLevel::writePlotFile (const std::string& dir, } #ifdef AMREX_USE_EB - // volfrac threshhold for amrvis - if (level == parent->finestLevel()) { - for (int lev = 0; lev <= parent->finestLevel(); ++lev) { - os << "1.0e-6\n"; + if (EB2::TopIndexSpaceIfPresent()) { + // volfrac threshhold for amrvis + if (level == parent->finestLevel()) { + for (int lev = 0; lev <= parent->finestLevel(); ++lev) { + os << "1.0e-6\n"; + } } } #endif @@ -342,9 +343,11 @@ AmrLevel::writePlotFile (const std::string& dir, } #ifdef AMREX_USE_EB - plotMF.setVal(0.0, cnt, 1, nGrow); - auto factory = static_cast(m_factory.get()); - MultiFab::Copy(plotMF,factory->getVolFrac(),0,cnt,1,nGrow); + if (EB2::TopIndexSpaceIfPresent()) { + plotMF.setVal(0.0, cnt, 1, nGrow); + auto factory = static_cast(m_factory.get()); + MultiFab::Copy(plotMF,factory->getVolFrac(),0,cnt,1,nGrow); + } #endif // @@ -363,15 +366,15 @@ AmrLevel::writePlotFile (const std::string& dir, void -AmrLevel::writePlotFilePre (const std::string& dir, - std::ostream& os) +AmrLevel::writePlotFilePre (const std::string& /*dir*/, + std::ostream& /*os*/) { } void -AmrLevel::writePlotFilePost (const std::string& dir, - std::ostream& os) +AmrLevel::writePlotFilePost (const std::string& /*dir*/, + std::ostream& /*os*/) { } @@ -425,12 +428,17 @@ AmrLevel::restart (Amr& papa, parent->SetDistributionMap(level, dmap); #ifdef AMREX_USE_EB - m_factory = makeEBFabFactory(geom, grids, dmap, - {m_eb_basic_grow_cells, m_eb_volume_grow_cells, m_eb_full_grow_cells}, - m_eb_support_level); -#else - m_factory.reset(new FArrayBoxFactory()); + if (EB2::TopIndexSpaceIfPresent()) { + m_factory = makeEBFabFactory(geom, grids, dmap, + {m_eb_basic_grow_cells, + m_eb_volume_grow_cells, + m_eb_full_grow_cells}, + m_eb_support_level); + } else #endif + { + m_factory.reset(new FArrayBoxFactory()); + } state.resize(ndesc); for (int i = 0; i < ndesc; ++i) @@ -449,7 +457,7 @@ AmrLevel::restart (Amr& papa, } void -AmrLevel::set_state_in_checkpoint (Vector& state_in_checkpoint) +AmrLevel::set_state_in_checkpoint (Vector& /*state_in_checkpoint*/) { amrex::Error("Class derived AmrLevel has to handle this!"); } @@ -538,16 +546,16 @@ AmrLevel::checkPoint (const std::string& dir, void -AmrLevel::checkPointPre (const std::string& dir, - std::ostream& os) +AmrLevel::checkPointPre 
(const std::string& /*dir*/, + std::ostream& /*os*/) { BL_PROFILE("AmrLevel::checkPointPre()"); } void -AmrLevel::checkPointPost (const std::string& dir, - std::ostream& os) +AmrLevel::checkPointPost (const std::string& /*dir*/, + std::ostream& /*os*/) { BL_PROFILE("AmrLevel::checkPointPost()"); } @@ -660,7 +668,9 @@ FillPatchIterator::FillPatchIterator (AmrLevel& amrlevel, m_amrlevel(amrlevel), m_leveldata(leveldata), m_ncomp(0) -{} +{ + MFIter::depth = 0; +} FillPatchIteratorHelper::FillPatchIteratorHelper (AmrLevel& amrlevel, MultiFab& leveldata, @@ -701,6 +711,7 @@ FillPatchIterator::FillPatchIterator (AmrLevel& amrlevel, BL_ASSERT(AmrLevel::desc_lst[idx].inRange(scomp,ncomp)); BL_ASSERT(0 <= idx && idx < AmrLevel::desc_lst.size()); + MFIter::depth = 0; Initialize(boxGrow,time,idx,scomp,ncomp); #ifdef BL_USE_TEAM @@ -1012,7 +1023,9 @@ FillPatchIterator::Initialize (int boxGrow, } else { #ifdef AMREX_USE_EB - amrex::Abort("Grids must be properly nested for EB"); + if (EB2::TopIndexSpaceIfPresent()) { + amrex::Abort("Grids must be properly nested for EB"); + } #endif static bool first = true; @@ -1491,27 +1504,7 @@ FillPatchIteratorHelper::fill (FArrayBox& fab, FillPatchIteratorHelper::~FillPatchIteratorHelper () {} -FillPatchIterator::~FillPatchIterator () { -#ifdef USE_PERILLA - while(regionList.size()){ - RegionGraph* tmp= regionList.front(); - delete tmp; - regionList.pop_front(); - } - - while(mfList.size()){ - MultiFab *tmp= mfList.front(); - delete tmp; - mfList.pop_front(); - } - - while(stateDataList.size()){ - StateDataPhysBCFunct *tmp= stateDataList.front(); - delete tmp; - stateDataList.pop_front(); - } -#endif - } +FillPatchIterator::~FillPatchIterator () {} void AmrLevel::FillCoarsePatch (MultiFab& mf, @@ -1566,12 +1559,16 @@ AmrLevel::FillCoarsePatch (MultiFab& mf, crseBA.set(j,mapper->CoarseBox(bx, crse_ratio)); } + MultiFab crseMF; #ifdef AMREX_USE_EB - auto cfactory = makeEBFabFactory(cgeom, crseBA, mf_DM, {0,0,0}, EBSupport::basic); - MultiFab crseMF(crseBA,mf_DM,NComp,0,MFInfo(),*cfactory); -#else - MultiFab crseMF(crseBA,mf_DM,NComp,0); + if (EB2::TopIndexSpaceIfPresent()) { + auto cfactory = makeEBFabFactory(cgeom, crseBA, mf_DM, {0,0,0}, EBSupport::basic); + crseMF.define(crseBA,mf_DM,NComp,0,MFInfo(),*cfactory); + } else #endif + { + crseMF.define(crseBA,mf_DM,NComp,0); + } if ( level == 1 || amrex::ProperlyNested(crse_ratio, parent->blockingFactor(level), @@ -1830,7 +1827,8 @@ AmrLevel::derive (const std::string& name, Real time, MultiFab& mf, int dcomp) const Box& bx = mfi.growntilebox(); FArrayBox& derfab = mf[mfi]; FArrayBox const& datafab = srcMF[mfi]; - rec->derFuncFab()(bx, derfab, dcomp, ncomp, datafab, geom, time, rec->getBC(), level); + const int dncomp = rec->numDerive(); + rec->derFuncFab()(bx, derfab, dcomp, dncomp, datafab, geom, time, rec->getBC(), level); } } else @@ -2266,1104 +2264,5 @@ AmrLevel::CreateLevelDirectory (const std::string &dir) levelDirectoryCreated = true; } - -#ifdef USE_PERILLA - void FillPatchIterator::FillPatchSingleLevelPush (Amr& amr, MultiFab& mf, Real time, - Vector& smf, Vector& stime, - RegionGraph* destGraph, RegionGraph* srcGraph, int f, - MultiFab *dmf, - int scomp, int dcomp, int ncomp, - const Geometry& geom, StateDataPhysBCFunct& physbcf, bool singleT) - { - - BL_PROFILE("FillPatchSingleLevel"); - - BL_ASSERT(scomp+ncomp <= smf[0]->nComp()); - BL_ASSERT(dcomp+ncomp <= mf.nComp()); - BL_ASSERT(smf.size() == stime.size()); - BL_ASSERT(smf.size() != 0); - - int tg = WorkerThread::perilla_wid(); - int nt = 
WorkerThread::perilla_wtid(); - - if (smf.size() == 1) - { - //mf.copy(smf[0], scomp, dcomp, ncomp, 0, mf.nGrow(), geom.periodicity()); - Perilla::multifabCopyPushAsync( destGraph, srcGraph, &mf, smf[0], f, dcomp, scomp, ncomp, mf.nGrow(), 0, singleT); - } - else if (smf.size() == 2) - { - BL_ASSERT(smf[0]->boxArray() == smf[1]->boxArray()); - //PArray raii(PArrayManage); - //MultiFab * dmf; - int destcomp; - bool sameba; - if (mf.boxArray() == smf[0]->boxArray()) - { - //dmf = &mf; - destcomp = dcomp; - sameba = true; - - int fis = smf[0]->IndexArray()[f]; - int fid = mf.IndexArray()[f]; - const Box& bx = mf[fid].box(); - mf[fid].linInterp - ((*smf[0])[fis], - scomp, - (*smf[1])[fis], - scomp, - stime[0], - stime[1], - time, - bx, - destcomp, - ncomp); - Perilla::fillBoundaryPush(destGraph, &mf, f); - } - else - { - - //dmf = raii.push_back(new MultiFab(smf[0].boxArray(), ncomp, 0)); - //MultiFab dmf(smf[0].boxArray(), ncomp, 0); - destcomp = 0; - sameba = false; - - assert(smf[0]); - assert(smf[0]->IndexArray().size()>f); - assert(dmf); - assert(dmf->IndexArray().size()>f); - int fis = smf[0]->IndexArray()[f]; - int fid = dmf->IndexArray()[f]; - - for(int t=0; tfabTiles[f]->numTiles; t++) - if( singleT || t % (perilla::NUM_THREADS_PER_TEAM-1) == nt) - { - const Box& bx = *(srcGraph->fabTiles[f]->tileBx[t]); - - //const Box& bx = (*dmf)[fid].box(); - (*dmf)[fid].linInterp - ((*smf[0])[fis], - scomp, - (*smf[1])[fis], - scomp, - stime[0], - stime[1], - time, - bx, - destcomp, - ncomp); - } - if(!singleT) - srcGraph->worker[tg]->barr->sync(perilla::NUM_THREADS_PER_TEAM-1); // Barrier to synchronize team threads - int src_ngrow = 0; - int dst_ngrow = mf.nGrow(); - Perilla::multifabCopyPushAsync( destGraph, srcGraph, &mf, dmf, f, dcomp, 0, ncomp, mf.nGrow(), 0, singleT); - } - } - else - { - amrex::Abort("FillPatchSingleLevel: high-order interpolation in time not implemented yet"); - } - } - - - void FillPatchIterator::FillPatchTwoLevelsPush (Amr& amr, MultiFab& mf, Real time, - Vector& cmf, Vector& ct, - Vector& fmf, Vector& ft, - RegionGraph* destGraph, RegionGraph* csrcGraph, RegionGraph* fsrcGraph, int f, - FillPatchIterator* fpIter, - MultiFab *dmf, - MultiFab *dmff, - int scomp, int dcomp, int ncomp, - const Geometry& cgeom, const Geometry& fgeom, - StateDataPhysBCFunct& cbc, StateDataPhysBCFunct& fbc, - const IntVect& ratio, - Interpolater* mapper, const Vector& bcs, unsigned char pushLevel, bool singleT) - { - BL_PROFILE("FillPatchTwoLevels"); - - int ngrow = mf.nGrow(); - - if(f>=0){//fill only this fab - if(pushLevel & 0x01 ) - { - if (ngrow > 0 || mf.getBDKey() != fmf[0]->getBDKey()) - { - - if (!fpIter->m_fpc->ba_crse_patch.empty()) - { - FillPatchSingleLevelPush(amr, *(fpIter->m_mf_crse_patch), time, cmf, ct, fpIter->m_rg_crse_patch, csrcGraph, f, dmf, scomp, 0, ncomp, cgeom, cbc, singleT); - } - } - } - if((pushLevel & 0x02) && (pushLevel != 0x03)) - { - FillPatchSingleLevelPush(amr, mf, time, fmf, ft, destGraph, fsrcGraph, f, dmff, scomp, dcomp, ncomp, fgeom, fbc, singleT); - } - }else{ //fill the whole multifab - if(pushLevel & 0x01 && pushLevel & 0x02) - { - int tg = perilla::wid(); - for(int fi=0; fi < fmf[0]->IndexArray().size(); fi++) - { - if(WorkerThread::isMyRegion(tg,fi)) - { - FillPatchSingleLevelPush(amr, mf, time, fmf, ft, destGraph, fsrcGraph, fi, dmff, scomp, dcomp, ncomp, fgeom, fbc, singleT); - } - } - } - if(pushLevel & 0x04) - { - int tg = perilla::wid(); - for(int fi=0; fi < fmf[0]->IndexArray().size(); fi++) - { - if(WorkerThread::isMyRegion(tg,fi)) - { - 
FillPatchSingleLevelPush(amr, mf, time, fmf, ft, destGraph, fsrcGraph, fi, dmff, scomp, dcomp, ncomp, fgeom, fbc, singleT); - } - } - } - } - } - - void FillPatchIterator::FillPatchSingleLevelPull (MultiFab& mf, Real time, - Vector& smf, Vector& stime, - RegionGraph* destGraph, RegionGraph* srcGraph, int f, - int scomp, int dcomp, int ncomp, - const Geometry& geom, StateDataPhysBCFunct& physbcf, bool singleT) - { - - BL_PROFILE("FillPatchSingleLevel"); - - BL_ASSERT(scomp+ncomp <= smf[0]->nComp()); - BL_ASSERT(dcomp+ncomp <= mf.nComp()); - BL_ASSERT(smf.size() == stime.size()); - BL_ASSERT(smf.size() != 0); - - if (smf.size() == 1) - { - //mf.copy(smf[0], scomp, dcomp, ncomp, 0, mf.nGrow(), geom.periodicity()); - Perilla::multifabCopyPull( destGraph, srcGraph, &mf, smf[0], f, dcomp, scomp, ncomp, mf.nGrow(), 0, singleT); - } - else if (smf.size() == 2) - { - BL_ASSERT(smf[0]->boxArray() == smf[1]->boxArray()); - //Vector raii(PArrayManage); - MultiFab * dmf; - int destcomp; - bool sameba; - if (mf.boxArray() == smf[0]->boxArray()) { - dmf = &mf; - destcomp = dcomp; - sameba = true; - } else { - //dmf = srcGraph->assocMF; - destcomp = 0; - sameba = false; - } - if (sameba) - { - // Note that when sameba is true mf's BoxArray is nonoverlapping. - // So FillBoundary is safe. - //mf.FillBoundary(dcomp,ncomp,geom.periodicity()); - Perilla::fillBoundaryPull(destGraph, dmf, f, singleT); - } - else - { - int src_ngrow = 0; - int dst_ngrow = mf.nGrow(); - MultiFab* dummyMF; - //mf.copy(*dmf, 0, dcomp, ncomp, src_ngrow, dst_ngrow, geom.periodicity()); - Perilla::multifabCopyPull( destGraph, srcGraph, &mf, dummyMF, f, dcomp, 0, ncomp, mf.nGrow(), 0, singleT); - } - } - else { - amrex::Abort("FillPatchSingleLevel: high-order interpolation in time not implemented yet"); - } -#if 0 - physbcf.doit_fab(mf, f, dcomp, ncomp, time); -#endif - } - - void FillPatchIterator::FillPatchTwoLevelsPull (MultiFab& mf, Real time, - Vector& cmf, Vector& ct, - Vector& fmf, Vector& ft, - RegionGraph* destGraph, RegionGraph* csrcGraph, RegionGraph* fsrcGraph, int f, - FillPatchIterator* fpIter, - int scomp, int dcomp, int ncomp, - const Geometry& cgeom, const Geometry& fgeom, - StateDataPhysBCFunct& cbc, StateDataPhysBCFunct& fbc, - const IntVect& ratio, - Interpolater* mapper, const Vector& bcs, bool singleT) - { - BL_PROFILE("FillPatchTwoLevels"); - - int ngrow = mf.nGrow(); - - int tg = WorkerThread::perilla_wid(); - int nt = WorkerThread::perilla_wtid(); - - if (ngrow > 0 || mf.getBDKey() != fmf[0]->getBDKey()) - { - - if ( ! 
fpIter->m_fpc->ba_crse_patch.empty()) - { - - int idummy1=0, idummy2=0; - bool cc = fpIter->m_fpc->ba_crse_patch.ixType().cellCentered(); - { - int gi = mf.IndexArray()[f]; - for(int i=0; itask[f]->depTaskIDs.size();i++) - { - int li = destGraph->task[f]->depTaskIDs[i]; - int mfi = fpIter->m_mf_crse_patch[0].IndexArray()[li]; - FillPatchSingleLevelPull(*(fpIter->m_mf_crse_patch), time, cmf, ct, fpIter->m_rg_crse_patch, csrcGraph, li, scomp, 0, ncomp, cgeom, cbc, singleT); - } - if(!singleT) - destGraph->worker[tg]->barr->sync(perilla::NUM_THREADS_PER_TEAM-1); - - int nt = WorkerThread::perilla_wtid(); - Box fdomain = fgeom.Domain(); - for(int i=0; itask[f]->depTaskIDs.size();i++) - { - int li = destGraph->task[f]->depTaskIDs[i]; - int mfi = fpIter->m_mf_crse_patch[0].IndexArray()[li]; - if(singleT) - { - const Box& dbx = fpIter->m_fpc->dst_boxes[li]; - //Array bcr(ncomp); - Vector bcr(ncomp); - amrex::setBC(dbx,fdomain,scomp,0,ncomp,bcs,bcr); - - mapper->interp(fpIter->m_mf_crse_patch[0][mfi], - 0, - mf[gi], - dcomp, - ncomp, - dbx, - ratio, - cgeom, - fgeom, - bcr, - idummy1, idummy2, RunOn::Cpu); - } - else - { - if(!cc) - { - if(WorkerThread::perilla_isMasterWorkerThread()) - { - const Box& dbx = fpIter->m_fpc->dst_boxes[li]; - //Box fdomain = fgeom.Domain(); - - Vector bcr(ncomp); - amrex::setBC(dbx,fdomain,scomp,0,ncomp,bcs,bcr); - - mapper->interp(fpIter->m_mf_crse_patch[0][mfi], - 0, - mf[gi], - dcomp, - ncomp, - dbx, - ratio, - cgeom, - fgeom, - bcr, - idummy1, idummy2, RunOn::Cpu); - - } - } - else - { - if(i % (perilla::NUM_THREADS_PER_TEAM-1) == nt-1) - { - - const Box& dbx = fpIter->m_fpc->dst_boxes[li]; - - Vector bcr(ncomp); - amrex::setBC(dbx,fdomain,scomp,0,ncomp,bcs,bcr); - - mapper->interp(fpIter->m_mf_crse_patch[0][mfi], - 0, - mf[gi], - dcomp, - ncomp, - dbx, - ratio, - cgeom, - fgeom, - bcr, - idummy1, idummy2, RunOn::Cpu); - - } - } - } - //destGraph->worker[tg]->barr->sync(perilla::NUM_THREADS_PER_TEAM-1); - } - if(!singleT) - destGraph->worker[tg]->barr->sync(perilla::NUM_THREADS_PER_TEAM-1); - } - } - } - - - FillPatchSingleLevelPull(mf, time, fmf, ft, destGraph, fsrcGraph, f, scomp, dcomp, ncomp, fgeom, fbc, singleT); - } - -void FillPatchIterator::FillFromTwoLevelsPush (Real time, - int index, - int scomp, - int dcomp, - int ncomp, - int f, - unsigned char pushLevel, - bool singleT) -{ - int ilev_fine = m_amrlevel.level; - int ilev_crse = ilev_fine-1; - - BL_ASSERT(ilev_crse >= 0); - - AmrLevel& fine_level = m_amrlevel; - AmrLevel& crse_level = m_amrlevel.parent->getLevel(ilev_crse); - - Geometry* tgeom_fine = &fine_level.geom; - Geometry* tgeom_crse = &crse_level.geom; - - Vector tsmf_crse; - Vector tsmf_fine; - Vector tstime_crse; - Vector tstime_fine; - StateData& statedata_crse = crse_level.state[index]; - statedata_crse.getData(tsmf_crse,tstime_crse,time); - StateDataPhysBCFunct* tphysbcf_crse = new StateDataPhysBCFunct(statedata_crse,scomp,*geom_crse); - - StateData& statedata_fine = fine_level.state[index]; - statedata_fine.getData(tsmf_fine,tstime_fine,time); - StateDataPhysBCFunct* tphysbcf_fine = new StateDataPhysBCFunct(statedata_fine,scomp,*geom_fine); - - const StateDescriptor& desc = AmrLevel::desc_lst[index]; - - FillPatchTwoLevelsPush(*(m_amrlevel.parent), m_fabs, time, - tsmf_crse, tstime_crse, - tsmf_fine, tstime_fine, - destGraph, csrcGraph, fsrcGraph, f, - this, - dmf, - dmff, - scomp, dcomp, ncomp, - *tgeom_crse, *tgeom_fine, - *tphysbcf_crse, *tphysbcf_fine, - crse_level.fineRatio(), - desc.interp(scomp), desc.getBCs(), pushLevel, singleT); 
-
-void
-FillPatchIterator::FillFromTwoLevelsPushOnly (Real time, int index, int scomp, int dcomp, int ncomp, int f, unsigned char pushLevel, bool singleT)
-{
-    int ilev_fine = m_amrlevel.level;
-    int ilev_crse = ilev_fine-1;
-
-    BL_ASSERT(ilev_crse >= 0);
-
-    AmrLevel& fine_level = m_amrlevel;
-    AmrLevel& crse_level = m_amrlevel.parent->getLevel(ilev_crse);
-
-    //if(physbcf_fine == NULL && physbcf_crse == NULL)
-    //{
-
-    Geometry* tgeom_fine = &fine_level.geom;
-    Geometry* tgeom_crse = &crse_level.geom;
-
-    Vector<MultiFab*> tsmf_crse;
-    Vector<MultiFab*> tsmf_fine;
-    Vector<Real> tstime_crse;
-    Vector<Real> tstime_fine;
-    StateData& statedata_crse = crse_level.state[index];
-    statedata_crse.getData(tsmf_crse,tstime_crse,time);
-    StateDataPhysBCFunct* tphysbcf_crse = new StateDataPhysBCFunct(statedata_crse,scomp,*geom_crse);
-
-    StateData& statedata_fine = fine_level.state[index];
-    statedata_fine.getData(tsmf_fine,tstime_fine,time);
-    StateDataPhysBCFunct* tphysbcf_fine = new StateDataPhysBCFunct(statedata_fine,scomp,*geom_fine);
-    //}
-
-    const StateDescriptor& desc = AmrLevel::desc_lst[index];
-
-    FillPatchTwoLevelsPush(*(m_amrlevel.parent), m_fabs, time,
-                           tsmf_crse, tstime_crse, tsmf_fine, tstime_fine,
-                           destGraph, csrcGraph, fsrcGraph, f, this, dmf, dmff,
-                           scomp, dcomp, ncomp, *tgeom_crse, *tgeom_fine,
-                           *tphysbcf_crse, *tphysbcf_fine, crse_level.fineRatio(),
-                           desc.interp(scomp), desc.getBCs(), pushLevel, singleT);
-}
-
-void FillPatchIterator::FillFromTwoLevelsPull (Real time, int index, int scomp, int dcomp, int ncomp, int f, bool singleT)
-{
-    int ilev_fine = m_amrlevel.level;
-    int ilev_crse = ilev_fine-1;
-
-    BL_ASSERT(ilev_crse >= 0);
-
-    AmrLevel& fine_level = m_amrlevel;
-    AmrLevel& crse_level = m_amrlevel.parent->getLevel(ilev_crse);
-
-    Geometry* tgeom_fine = &fine_level.geom;
-    Geometry* tgeom_crse = &crse_level.geom;
-
-    Vector<MultiFab*> tsmf_crse;
-    Vector<MultiFab*> tsmf_fine;
-    Vector<Real> tstime_crse;
-    Vector<Real> tstime_fine;
-    StateData& statedata_crse = crse_level.state[index];
-    statedata_crse.getData(tsmf_crse,tstime_crse,time);
-    StateDataPhysBCFunct* tphysbcf_crse = new StateDataPhysBCFunct(statedata_crse,scomp,*geom_crse);
-
-    StateData& statedata_fine = fine_level.state[index];
-    statedata_fine.getData(tsmf_fine,tstime_fine,time);
-    StateDataPhysBCFunct* tphysbcf_fine = new StateDataPhysBCFunct(statedata_fine,scomp,*geom_fine);
-
-    const StateDescriptor& desc = AmrLevel::desc_lst[index];
-
-    FillPatchTwoLevelsPull(m_fabs, time,
-                           tsmf_crse, tstime_crse, tsmf_fine, tstime_fine,
-                           destGraph, csrcGraph, fsrcGraph, f, this,
-                           scomp, dcomp, ncomp, *tgeom_crse, *tgeom_fine,
-                           *tphysbcf_crse, *tphysbcf_fine, crse_level.fineRatio(),
-                           desc.interp(scomp), desc.getBCs(), singleT);
-}
-
-void
-FillPatchIterator::FillPatchPush (int boxGrow, Real time, int index, int scomp, int ncomp,
-                                  int f, unsigned char pushLevel, bool singleT)
-{
-    BL_PROFILE("FillPatchIterator::InitializePush");
-
-    BL_ASSERT(scomp >= 0);
-    BL_ASSERT(ncomp >= 1);
-    BL_ASSERT(0 <= index && index < AmrLevel::desc_lst.size());
-
-    //const IndexType& boxType = m_leveldata.boxArray().ixType();
-    const int level = m_amrlevel.level;
-
-    for (int i = 0, DComp = 0; i < m_range.size(); i++)
-    {
-        if(i>0)
-            amrex::Abort("**** Error in FillPatchIterator::Initialize: non contigeous components not implemented");
-
-        const int SComp = m_range[i].first;
-        const int NComp = m_range[i].second;
-
-        if (level == 0)
-        {
-            FillPatchSingleLevelPush (*(m_amrlevel.parent), m_fabs, time, smf, stime, destGraph, fsrcGraph, f, dmf, SComp, DComp,
-                                      NComp, *geom, *physbcf, singleT);
-        }
-        else
-        {
-            if (level == 1 || isProperlyNested)
-            {
-                FillFromTwoLevelsPushOnly(time, index, SComp, DComp, NComp, f, pushLevel, singleT);
-            } else {
-                amrex::Abort("**** Error in FillPatchIterator::Initialize: !ProperlyNested not implemented");
-            }
-        }
-        DComp += NComp;
-    }
-}
-
-void
-FillPatchIterator::FillPatchPull (int boxGrow, Real time, int index, int scomp, int ncomp, int f, bool singleT)
-{
-    BL_PROFILE("FillPatchIterator::InitializePull");
-
-    BL_ASSERT(scomp >= 0);
-    BL_ASSERT(ncomp >= 1);
-    BL_ASSERT(0 <= index && index < AmrLevel::desc_lst.size());
-
-    //const IndexType& boxType = m_leveldata.boxArray().ixType();
-    const int level = m_amrlevel.level;
-
-    for (int i = 0, DComp = 0; i < m_range.size(); i++)
-    {
-        if(i>0)
-            amrex::Abort("**** Error in FillPatchIterator::Initialize: non contigeous components not implemented");
-
-        const int SComp = m_range[i].first;
-        const int NComp = m_range[i].second;
-
-        if (level == 0)
-        {
-            FillPatchSingleLevelPull (m_fabs, time, smf, stime, destGraph, fsrcGraph, f, SComp, DComp, NComp, *geom, *physbcf, singleT);
-        }
-        else
-        {
-            if (level == 1 || isProperlyNested)
-            {
-                FillFromTwoLevelsPull(time, index, SComp, DComp, NComp, f, singleT);
-            } else {
-                amrex::Abort("**** Error in FillPatchIterator::Initialize: !ProperlyNested not implemented");
-            }
-        }
-        //if(WorkerThread::isTeamMasterThread(tid))
-        {
-            const MultiFab& mf_fillpatched = m_fabs;
-
-            if(singleT)
-            {
-                for(int t=0; t<destGraph->fabTiles_gtbx[f]->numTiles; t++)
-                {
-                    const Box& bx = *(destGraph->fabTiles_gtbx[f]->tileBx[t]);
-                    MultiFab::Copy(m_leveldata, mf_fillpatched, f, 0, DComp, ncomp, bx);
-                }
-            }
-            else
-            {
-                perilla::syncAllWorkerThreads();
-                int nt = WorkerThread::perilla_wtid();
-                for(int t=0; t<destGraph->fabTiles_gtbx[f]->numTiles; t++)
-                    if(t % (perilla::NUM_THREADS_PER_TEAM-1) == nt-1)
-                    {
-                        const Box& bx = *(destGraph->fabTiles_gtbx[f]->tileBx[t]);
-                        MultiFab::Copy(m_leveldata, mf_fillpatched, f, 0, DComp, ncomp, bx);
-                    }
-                perilla::syncAllWorkerThreads();
-            }
-        }
-        DComp += NComp;
-    }
-    //
-    // Call hack to touch up fillPatched data.
-    //
-    /*m_amrlevel.set_preferred_boundary_values(m_fabs, index, scomp, 0, ncomp, time);*/
-
-}
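FillPatchPush and FillPatchPull are the two halves of one split-phase fill: the push posts the sends, and the pull completes the receives and only then copies the filled FAB tile by tile into m_leveldata. A rough standalone analogy using std::promise/std::future in place of the region-graph channel (illustration only, not the Perilla API):

    #include <future>
    #include <vector>
    #include <numeric>
    #include <cstdio>

    int main()
    {
        std::promise<std::vector<double>> channel;   // stands in for the region graph
        std::future<std::vector<double>> incoming = channel.get_future();

        // "Push" phase: produce and send the patch data.
        std::vector<double> patch(8);
        std::iota(patch.begin(), patch.end(), 0.0);
        channel.set_value(patch);

        // "Pull" phase: wait for the data, then copy it into the destination.
        std::vector<double> leveldata = incoming.get();
        std::printf("pulled %zu values, first = %g\n", leveldata.size(), leveldata[0]);
    }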
-
-void
-FillPatchIterator::initFillPatch(int boxGrow, int time, int index, int scomp, int ncomp, int iter)
-{
-#ifdef USE_PERILLA_PTHREADS
-//    perilla::syncAllThreads();
-#endif
-    BL_ASSERT(scomp >= 0);
-    BL_ASSERT(ncomp >= 1);
-    BL_ASSERT(0 <= index && index < AmrLevel::desc_lst.size());
-
-    const StateDescriptor& desc = AmrLevel::desc_lst[index];
-#ifdef USE_PERILLA_PTHREADS
-//    if(perilla::isMasterThread())
-#endif
-    {
-        m_ncomp = ncomp;
-        m_range = desc.sameInterps(scomp,ncomp);
-
-        m_fabs.define(m_leveldata.boxArray(),m_leveldata.DistributionMap(), m_ncomp,boxGrow);
-
-        BL_ASSERT(m_leveldata.DistributionMap() == m_fabs.DistributionMap());
-    }
-#ifdef USE_PERILLA_PTHREADS
-//    perilla::syncAllThreads();
-#endif
-
-    const IndexType& boxType = m_leveldata.boxArray().ixType();
-    const int level = m_amrlevel.level;
-
-    for (int i = 0, DComp = 0; i < m_range.size(); i++)
-    {
-        const int SComp = m_range[i].first;
-        const int NComp = m_range[i].second;
-        int dcomp = DComp;
-        if (level == 0)
-        {
-#if 1
-#ifdef USE_PERILLA_PTHREADS
-//    perilla::syncAllThreads();
-//    if(perilla::isMasterThread())
-#endif
-            {
-                BL_ASSERT(m_amrlevel.level == 0);
-                StateData& statedata = m_amrlevel.state[index];
-                statedata.getData(smf,stime,time);
-                geom = &m_amrlevel.geom;
-                physbcf = new StateDataPhysBCFunct(statedata,scomp,*geom);
-                stateDataList.push_back(physbcf);
-                BL_ASSERT(scomp+ncomp <= smf[0]->nComp());
-                BL_ASSERT(dcomp+ncomp <= m_fabs.nComp());
-                BL_ASSERT(smf.size() == stime.size());
-                BL_ASSERT(smf.size() != 0);
-            }
-#ifdef USE_PERILLA_PTHREADS
-//    perilla::syncAllThreads();
-#endif
-            if (smf.size() == 1)
-            {
-#ifdef USE_PERILLA_PTHREADS
-//    if(perilla::isMasterThread())
-#endif
-                {
-                    destGraph = new RegionGraph(m_fabs.IndexArray().size());
-                    fsrcGraph = new RegionGraph(smf[0]->IndexArray().size());
-                    regionList.push_back(destGraph);
-                    regionList.push_back(fsrcGraph);
-                }
-#ifdef USE_PERILLA_PTHREADS
-//    perilla::syncAllThreads();
-#endif
-#if 1
-                Perilla::multifabExtractCopyAssoc( destGraph, fsrcGraph, m_fabs, *(smf[0]), (const int) ncomp, m_fabs.nGrow(), 0, geom->periodicity());
-#endif
-#ifdef USE_PERILLA_PTHREADS
-//    perilla::syncAllThreads();
-//    if(perilla::isMasterThread())
-#endif
-                {
-                    m_amrlevel.parent->graphArray[level].push_back(destGraph);
-                    m_amrlevel.parent->graphArray[level].push_back(fsrcGraph);
-                }
-#ifdef USE_PERILLA_PTHREADS
-//    perilla::syncAllThreads();
-#endif
-            }
-            else if (smf.size() == 2)
-            {
-                BL_ASSERT(smf[0]->boxArray() == smf[1]->boxArray());
-
-                if (m_fabs.boxArray() == smf[0]->boxArray())
-                {
-#ifdef USE_PERILLA_PTHREADS
-//    if(perilla::isMasterThread())
-#endif
-                    {
-                        dmf = &m_fabs;
-                        destGraph = new RegionGraph(m_fabs.IndexArray().size());
-                        regionList.push_back(destGraph);
-                    }
-#ifdef USE_PERILLA_PTHREADS
-//    perilla::syncAllThreads();
-#endif
-                    Perilla::multifabBuildFabCon(destGraph, m_fabs, geom->periodicity());
-#ifdef USE_PERILLA_PTHREADS
-//    perilla::syncAllThreads();
-//    if(perilla::isMasterThread())
-#endif
-                    {
-                        m_amrlevel.parent->graphArray[level].push_back(destGraph);
-                    }
-                }
-                else
-                {
-#ifdef USE_PERILLA_PTHREADS
-//    if(perilla::isMasterThread())
-#endif
-                    {
-                        dmf = new MultiFab(smf[0]->boxArray(), smf[0]->DistributionMap(), ncomp, 0);
-                        //dmf->initVal(); // for Perilla NUMA
-                        destGraph = new RegionGraph(m_fabs.IndexArray().size());
-                        fsrcGraph = new RegionGraph(dmf->IndexArray().size());
-                        fsrcGraph->buildTileArray(*dmf);
-                        regionList.push_back(destGraph);
-                        regionList.push_back(fsrcGraph);
-                        mfList.push_back(dmf);
-                    }
-#ifdef USE_PERILLA_PTHREADS
-//    perilla::syncAllThreads();
-#endif
-
-                    Perilla::multifabExtractCopyAssoc(destGraph, fsrcGraph, m_fabs, *dmf, ncomp, m_fabs.nGrow(), 0, geom->periodicity());
-
-#ifdef USE_PERILLA_PTHREADS
-//    perilla::syncAllThreads();
-//    if(perilla::isMasterThread())
-#endif
-                    {
-                        m_amrlevel.parent->graphArray[level].push_back(destGraph);
-                        m_amrlevel.parent->graphArray[level].push_back(fsrcGraph);
-                    }
-#ifdef USE_PERILLA_PTHREADS
-//    perilla::syncAllThreads();
-#endif
-                }
-            }
-            else
-            {
-                //BoxLib::Abort("FillPatchSingleLevel: high-order interpolation in time not implemented yet");
-            }
-#endif
-            //-------------------------------------------------- FillFromLevel0 initialization completed
-        }
-        else
-        {
-#ifdef USE_PERILLA_PTHREADS
-//    perilla::syncAllThreads();
-//    if(perilla::isMasterThread())
-#endif
-            {
-                isProperlyNested = amrex::ProperlyNested(m_amrlevel.crse_ratio,
-                                                         m_amrlevel.parent->blockingFactor(m_amrlevel.level),
-                                                         boxGrow, boxType, desc.interp(SComp));
-            }
-#ifdef USE_PERILLA_PTHREADS
-//    perilla::syncAllThreads();
-#endif
-            if (level == 1 || isProperlyNested)
-            {
-                int ilev_fine = m_amrlevel.level;
-                int ilev_crse = ilev_fine-1;
-                BL_ASSERT(ilev_crse >= 0);
-                AmrLevel& fine_level = m_amrlevel;
-                AmrLevel& crse_level = m_amrlevel.parent->getLevel(ilev_crse);
-#ifdef USE_PERILLA_PTHREADS
-//    if(perilla::isMasterThread())
-#endif
-                {
-                    geom_fine = &fine_level.geom;
-                    geom_crse = &crse_level.geom;
-                }
-                StateData& statedata_crse = crse_level.state[index];
-                StateData& statedata_fine = fine_level.state[index];
-#ifdef USE_PERILLA_PTHREADS
-//    perilla::syncAllThreads();
-//    if(perilla::isMasterThread())
-#endif
-                {
-                    statedata_crse.getData(smf_crse,stime_crse,time);
-                    statedata_fine.getData(smf_fine,stime_fine,time);
-                    physbcf_crse = new StateDataPhysBCFunct(statedata_crse,scomp,*geom_crse);
-                    physbcf_fine = new StateDataPhysBCFunct(statedata_fine,scomp,*geom_fine);
-                    stateDataList.push_back(physbcf_crse);
-                    stateDataList.push_back(physbcf_fine);
-                }
-#ifdef USE_PERILLA_PTHREADS
-//    perilla::syncAllThreads();
-#endif
-                const StateDescriptor& desc = AmrLevel::desc_lst[index];
-                int ngrow = m_fabs.nGrow();
-                if (ngrow > 0 || m_fabs.getBDKey() != smf_fine[0]->getBDKey())
-                {
-#ifdef USE_PERILLA_PTHREADS
-//    if(perilla::isMasterThread())
-#endif
-                    {
-                        InterpolaterBoxCoarsener coarsener = desc.interp(scomp)->BoxCoarsener(crse_level.fineRatio());
-                        Box fdomain = geom_fine->Domain();
-                        fdomain.convert(m_fabs.boxArray().ixType());
-                        Box fdomain_g(fdomain);
-                        for (int i = 0; i < BL_SPACEDIM; ++i) {
-                            if (geom_fine->isPeriodic(i)) {
-                                fdomain_g.grow(i,ngrow);
-                            }
-                        }
-                        Box c_dom = amrex::coarsen(geom_fine->Domain(), m_amrlevel.crse_ratio);
-                        m_fpc = &FabArrayBase::TheFPinfo(*(smf_fine[0]), m_fabs, fdomain_g, IntVect(ngrow), coarsener, c_dom, NULL);
-                    }
-#ifdef USE_PERILLA_PTHREADS
-//    perilla::syncAllThreads();
-#endif
-                    if (!m_fpc->ba_crse_patch.empty())
-                    {
-#ifdef USE_PERILLA_PTHREADS
-                        if(perilla::isMasterThread())
-#endif
-                        {
-                            m_mf_crse_patch = new MultiFab(m_fpc->ba_crse_patch, m_fpc->dm_crse_patch, ncomp, 0);
-                            mfList.push_back(m_mf_crse_patch);
-                            //m_mf_crse_patch->initVal(); // for Perilla NUMA
-                            BL_ASSERT(scomp+ncomp <= smf_crse[0]->nComp());
-                            BL_ASSERT(dcomp+ncomp <= m_mf_crse_patch->nComp());
-                            BL_ASSERT(smf_crse.size() == stime_crse.size());
-                            BL_ASSERT(smf_crse.size() != 0);
-                        }
-#ifdef USE_PERILLA_PTHREADS
-//    perilla::syncAllThreads();
-#endif
-                        if (iter == 1)
-                        {
-#ifdef USE_PERILLA_PTHREADS
-//    if(perilla::isMasterThread())
-#endif
-                            {
-                                m_rg_crse_patch = new RegionGraph(m_mf_crse_patch->IndexArray().size());
-                                m_rg_crse_patch->isDepGraph = true;
-                                csrcGraph = new RegionGraph(smf_crse[0]->IndexArray().size());
-                                regionList.push_back(m_rg_crse_patch);
-                                regionList.push_back(csrcGraph);
-                            }
-#ifdef USE_PERILLA_PTHREADS
-//    perilla::syncAllThreads();
-#endif
-#if 1
-                            Perilla::multifabExtractCopyAssoc( m_rg_crse_patch, csrcGraph, *m_mf_crse_patch, *(smf_crse[0]), ncomp, m_mf_crse_patch->nGrow(), 0, geom_crse->periodicity());
-#endif
-#ifdef USE_PERILLA_PTHREADS
-//    perilla::syncAllThreads();
-//    if(perilla::isMasterThread())
-#endif
-                            {
-                                m_amrlevel.parent->graphArray[level].push_back(m_rg_crse_patch);
-                                m_amrlevel.parent->graphArray[level].push_back(csrcGraph);
-                            }
-                        }
-                        else if (iter > 1)
-                        {
-#if 1
-                            //BL_ASSERT(smf_crse[0].boxArray() == smf_crse[1].boxArray());
-                            //PArray<MultiFab> raii(PArrayManage);
-                            //MultiFab * dmf;
-
-                            if (m_mf_crse_patch->boxArray() == smf_crse[0]->boxArray())
-                            {
-                                //dmf = m_mf_crse_patch;
-                                m_rg_crse_patch = new RegionGraph(m_mf_crse_patch->IndexArray().size());
-
-                                //std::cout<< " level " << level << " rg_crs_ptch ID " << m_rg_crse_patch->graphID << std::endl;
-
-                                Perilla::multifabBuildFabCon(m_rg_crse_patch, *m_mf_crse_patch, geom->periodicity());
-                                m_amrlevel.parent->graphArray[level].push_back(m_rg_crse_patch);
-                                regionList.push_back(m_rg_crse_patch);
-                            }
-                            else
-                            {
-#ifdef USE_PERILLA_PTHREADS
-//    if(perilla::isMasterThread())
-#endif
-                                {
-                                    //dmf = raii.push_back(new MultiFab(smf_crse[0].boxArray(), ncomp, 0));
-                                    dmf = new MultiFab(smf_crse[0]->boxArray(), smf_crse[0]->DistributionMap(), ncomp, 0);
-                                    //dmf->initVal(); // for Perilla NUMA
-                                    m_rg_crse_patch = new RegionGraph(m_mf_crse_patch->IndexArray().size());
-                                    m_rg_crse_patch->isDepGraph = true;
-                                    csrcGraph = new RegionGraph(dmf->IndexArray().size());
-                                    csrcGraph->buildTileArray(*dmf);
-                                    regionList.push_back(m_rg_crse_patch);
-                                    regionList.push_back(csrcGraph);
-                                    mfList.push_back(dmf);
-                                }
-#ifdef USE_PERILLA_PTHREADS
-//    perilla::syncAllThreads();
-#endif
-#if 1
-                                Perilla::multifabExtractCopyAssoc( m_rg_crse_patch, csrcGraph, *m_mf_crse_patch, *dmf, ncomp, m_mf_crse_patch->nGrow(), 0, geom_crse->periodicity());
-#endif
-#ifdef USE_PERILLA_PTHREADS
-//    perilla::syncAllThreads();
-//    if(perilla::isMasterThread())
-#endif
-                                {
-                                    m_amrlevel.parent->graphArray[level].push_back(m_rg_crse_patch);
-                                    m_amrlevel.parent->graphArray[level].push_back(csrcGraph);
-                                }
-                            }
-#endif
-                        }
-                        else
-                        {
-                            // BoxLib::Abort("FillPatchSingleLevel: high-order interpolation in time not implemented yet");
-                        }
-                    }
-                }
-#if 1
-                BL_ASSERT(scomp+ncomp <= smf_fine[0]->nComp());
-                BL_ASSERT(dcomp+ncomp <= m_fabs.nComp());
-                BL_ASSERT(smf_fine.size() == stime_fine.size());
-                BL_ASSERT(smf_fine.size() != 0);
-
-                if(true) // it will always be the case because same level comm and time will be available
-                {
-#ifdef USE_PERILLA_PTHREADS
-//    if(perilla::isMasterThread())
-#endif
-                    {
-                        dmff = new MultiFab(smf_fine[0]->boxArray(), smf_fine[0]->DistributionMap(), ncomp, 0);
-                        destGraph = new RegionGraph(m_fabs.IndexArray().size());
-                        //fsrcGraph = new RegionGraph(smf_fine[0]->IndexArray().size());
-                        fsrcGraph = new RegionGraph(dmff->IndexArray().size());
-                        regionList.push_back(destGraph);
-                        regionList.push_back(fsrcGraph);
-                        mfList.push_back(dmff);
-
-                        if(m_rg_crse_patch != 0)
-                        {
-                            destGraph->srcLinkGraph = m_rg_crse_patch;
-                            //for(int lfi=0; lfi < destGraph->numTasks; lfi++ )
-                            {
-                                for (MFIter mfi(*(m_mf_crse_patch),false); mfi.isValid(); ++mfi)
-                                {
-                                    int li = mfi.LocalIndex();
-                                    int gi = m_fpc->dst_idxs[li];
-                                    //if(gi == m_mf_crse_patch->IndexArray()[li])
-                                    {
-                                        int lfi = m_fabs.localindex(gi);
-                                        destGraph->task[lfi]->depTasksCompleted = false;
-                                        destGraph->task[lfi]->depTaskIDs.push_back(li);
-                                    }
-                                }
-                            }
-                        }
-                    }
-#ifdef USE_PERILLA_PTHREADS
-//    perilla::syncAllThreads();
-#endif
-
-                    //if(level == 2)
-                    //std::cout<< "Sending In " << std::endl;
-#if 1
-                    Perilla::multifabExtractCopyAssoc( destGraph, fsrcGraph, m_fabs, *dmff, ncomp, m_fabs.nGrow(), 0, geom_fine->periodicity());
-#endif
-#ifdef USE_PERILLA_PTHREADS
-//    perilla::syncAllThreads();
-//    if(perilla::isMasterThread())
-#endif
-                    {
-                        m_amrlevel.parent->graphArray[level].push_back(destGraph);
-                        m_amrlevel.parent->graphArray[level].push_back(fsrcGraph);
-                    }
-                }
-                else if (smf_fine.size() == 2)
-                {
-                    if (m_fabs.boxArray() == smf_fine[0]->boxArray())
-                    {
-                        //dmf = &m_fabs;
-                        destGraph = new RegionGraph(m_fabs.IndexArray().size());
-                        Perilla::multifabBuildFabCon(destGraph, m_fabs, geom->periodicity());
-                        m_amrlevel.parent->graphArray[level].push_back(destGraph);
-                        regionList.push_back(destGraph);
-                    }
-                    else
-                    {
-#ifdef USE_PERILLA_PTHREADS
-//    if(perilla::isMasterThread())
-#endif
-                        {
-                            //dmf = raii.push_back(new MultiFab(smf_fine[0].boxArray(), ncomp, 0));
-                            dmff = new MultiFab(smf_fine[0]->boxArray(), smf_fine[0]->DistributionMap(), ncomp, 0);
-                            //dmff->initVal(); // for Perilla NUMA
-                            destGraph = new RegionGraph(m_fabs.IndexArray().size());
-                            fsrcGraph = new RegionGraph(dmff->IndexArray().size());
-                            fsrcGraph->buildTileArray(*dmff);
-                            regionList.push_back(destGraph);
-                            regionList.push_back(fsrcGraph);
-                            mfList.push_back(dmff);
-                        }
-#ifdef USE_PERILLA_PTHREADS
-//    perilla::syncAllThreads();
-#endif
-#if 1
-                        Perilla::multifabExtractCopyAssoc( destGraph, fsrcGraph, m_fabs, *dmff, ncomp, m_fabs.nGrow(), 0, geom_fine->periodicity());
-#endif
-#ifdef USE_PERILLA_PTHREADS
-//    perilla::syncAllThreads();
-//    if(perilla::isMasterThread())
-#endif
-                        {
-                            m_amrlevel.parent->graphArray[level].push_back(destGraph);
-                            m_amrlevel.parent->graphArray[level].push_back(fsrcGraph);
-                        }
-                    }
-                }
-                else
-                {
-                    amrex::Abort("FillPatchSingleLevel: high-order interpolation in time not implemented yet");
-                }
-#endif
-                //-------------------- FillFromTwoLevels initialization completed
-            } // if(level==1 OR ProperlyNested)
-            else
-            {
-                amrex::Abort("initFillPatch: level is not properly nested");
-            }
-        }
-
-        DComp += NComp;
-    }
-#if 1
-#ifdef USE_PERILLA_PTHREADS
-//    perilla::syncAllThreads();
-//    if(perilla::isMasterThread())
-#endif
-    {
-        destGraph->buildTileArray(m_fabs);
-        destGraph->buildTileArray_gtbx(m_leveldata,boxGrow);
-    }
-#ifdef USE_PERILLA_PTHREADS
-//    perilla::syncAllThreads();
-#endif
-#endif
-}
-
-FillPatchIterator::FillPatchIterator (AmrLevel& amrlevel, MultiFab& leveldata, int boxGrow,
-                                      Real time, int index, int scomp, int ncomp, int f)
-    :
-    MFIter(leveldata),
-    m_amrlevel(amrlevel),
-    m_leveldata(leveldata),
-    m_ncomp(ncomp),
-    physbcf(0),
-    physbcf_crse(0),
-    physbcf_fine(0),
-    destGraph(0),
-    fsrcGraph(0),
-    csrcGraph(0),
-    m_rg_crse_patch(NULL),
-    //raii(PArrayManage)
-    dmf(NULL),
-    dmff(NULL)
-{
-#if 1
-    BL_ASSERT(scomp >= 0);
-    BL_ASSERT(ncomp >= 1);
-    BL_ASSERT(AmrLevel::desc_lst[index].inRange(scomp,ncomp));
-    BL_ASSERT(0 <= index && index < AmrLevel::desc_lst.size());
-
-    //InitializePush(boxGrow,time,index,scomp,ncomp,f,tid);
-
-#ifdef BL_USE_TEAM
-    ParallelDescriptor::MyTeam().MemoryBarrier();
-#endif
-
-#endif
-}
-
-//end USE_PERILLA
-#endif
-}
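In these routines and in the deleted file that follows, pushLevel is a bitmask: 0x01 selects the coarse-patch traffic of a two-level fill, 0x02 the same-level fine traffic (skipped when the mask is exactly 0x03), 0x04 the whole-multifab push that seeds the next finer level, and 0xFF everything. A small sketch of that convention; the flag names are invented for illustration, since the deleted code uses the raw constants:

    #include <cstdio>

    // Hypothetical names for the raw bits used by the deleted code.
    enum : unsigned char {
        PUSH_CRSE       = 0x01,  // coarse patch of a two-level fill
        PUSH_FINE       = 0x02,  // same-level fine data
        PUSH_FINER_INIT = 0x04,  // whole-multifab push for the finer level's init
        PUSH_ALL        = 0xFF
    };

    void push(unsigned char pushLevel)
    {
        if (pushLevel & PUSH_CRSE)       std::printf("push coarse patch\n");
        if ((pushLevel & PUSH_FINE) && pushLevel != (PUSH_CRSE | PUSH_FINE))
            std::printf("push same-level fine data\n");
        if (pushLevel & PUSH_FINER_INIT) std::printf("push for finer-level init\n");
    }

    int main()
    {
        push(PUSH_FINE);   // the 0x02 mask SendIntraLevel passes below
        push(PUSH_ALL);    // the 0xFF mask initialSend passes on level 0
    }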
diff --git a/Src/Amr/AMReX_AsyncFillPatch.cpp b/Src/Amr/AMReX_AsyncFillPatch.cpp
deleted file mode 100644
index 0f99ab43fa2..00000000000
--- a/Src/Amr/AMReX_AsyncFillPatch.cpp
+++ /dev/null
@@ -1,1486 +0,0 @@
-#include
-#include
-#include
-#include
-
-#include
-#include
-#include
-#include
-#include
-#include
-#include
-#include
-#include
-
-#ifdef USE_PERILLA
-#include
-
-namespace amrex {
-    using namespace perilla;
-
-    AsyncFillPatchIterator::AsyncFillPatchIterator (AmrLevel& amrlevel, MultiFab& leveldata,
-                                                    int boxGrow, Real time, int index,
-                                                    int scomp, int ncomp, int iter)
-        :
-        MFIter(leveldata),
-        m_amrlevel(amrlevel),
-        m_leveldata(leveldata),
-        m_ncomp(ncomp),
-        physbcf(0),
-        physbcf_crse(0),
-        physbcf_fine(0),
-        destGraph(0),
-        fsrcGraph(0),
-        csrcGraph(0),
-        m_rg_crse_patch(0),
-        dmf(0),
-        dmff(0)
-    {
-        BL_ASSERT(scomp >= 0);
-        BL_ASSERT(ncomp >= 1);
-        BL_ASSERT(AmrLevel::desc_lst[index].inRange(scomp,ncomp));
-        BL_ASSERT(0 <= index && index < AmrLevel::desc_lst.size());
-
-        initFillPatch(boxGrow, time, index, scomp, ncomp, iter);
-
-#ifdef BL_USE_TEAM
-        ParallelDescriptor::MyTeam().MemoryBarrier();
-#endif
-    }
-
-    AsyncFillPatchIterator::~AsyncFillPatchIterator () {
-#ifdef USE_PERILLA
-        while(regionList.size()){
-            RegionGraph* tmp= regionList.front();
-            delete tmp;
-            regionList.pop_front();
-        }
-
-        while(mfList.size()){
-            MultiFab *tmp= mfList.front();
-            delete tmp;
-            mfList.pop_front();
-        }
-
-        while(stateDataList.size()){
-            StateDataPhysBCFunct *tmp= stateDataList.front();
-            delete tmp;
-            stateDataList.pop_front();
-        }
-#endif
-    }
-
-    void AsyncFillPatchIterator::FillFromTwoLevelsPush (Real time, int index, int scomp,
-                                                        int dcomp, int ncomp, int f,
-                                                        unsigned char pushLevel, bool singleT)
-    {
-        int ilev_fine = m_amrlevel.level;
-        int ilev_crse = ilev_fine-1;
-
-        BL_ASSERT(ilev_crse >= 0);
-
-        AmrLevel& fine_level = m_amrlevel;
-        AmrLevel& crse_level = m_amrlevel.parent->getLevel(ilev_crse);
-
-        Geometry* tgeom_fine = &fine_level.geom;
-        Geometry* tgeom_crse = &crse_level.geom;
-
-        Vector<MultiFab*> tsmf_crse;
-        Vector<MultiFab*> tsmf_fine;
-        Vector<Real> tstime_crse;
-        Vector<Real> tstime_fine;
-        StateData& statedata_crse = crse_level.state[index];
-        statedata_crse.getData(tsmf_crse,tstime_crse,time);
-        StateDataPhysBCFunct* tphysbcf_crse = new StateDataPhysBCFunct(statedata_crse,scomp,*geom_crse);
-
-        StateData& statedata_fine = fine_level.state[index];
-        statedata_fine.getData(tsmf_fine,tstime_fine,time);
-        StateDataPhysBCFunct* tphysbcf_fine = new StateDataPhysBCFunct(statedata_fine,scomp,*geom_fine);
-
-        const StateDescriptor& desc = AmrLevel::desc_lst[index];
-
-        FillPatchTwoLevelsPush(*(m_amrlevel.parent), m_fabs, time,
-                               tsmf_crse, tstime_crse, tsmf_fine, tstime_fine,
-                               destGraph, csrcGraph, fsrcGraph, f, this, dmf, dmff,
-                               scomp, dcomp, ncomp, *tgeom_crse, *tgeom_fine,
-                               *tphysbcf_crse, *tphysbcf_fine, crse_level.fineRatio(),
-                               desc.interp(scomp), desc.getBCs(), pushLevel, singleT);
-    }
-
-    void AsyncFillPatchIterator::FillFromTwoLevelsPull (Real time, int index, int scomp,
-                                                        int dcomp, int ncomp, int f, bool singleT)
-    {
-        int ilev_fine = m_amrlevel.level;
-        int ilev_crse = ilev_fine-1;
-
-        BL_ASSERT(ilev_crse >= 0);
-
-        AmrLevel& fine_level = m_amrlevel;
-        AmrLevel& crse_level = m_amrlevel.parent->getLevel(ilev_crse);
-
-        Geometry* tgeom_fine = &fine_level.geom;
-        Geometry* tgeom_crse = &crse_level.geom;
-
-        Vector<MultiFab*> tsmf_crse;
-        Vector<MultiFab*> tsmf_fine;
-        Vector<Real> tstime_crse;
-        Vector<Real> tstime_fine;
-        StateData& statedata_crse = crse_level.state[index];
-        statedata_crse.getData(tsmf_crse,tstime_crse,time);
-        StateDataPhysBCFunct* tphysbcf_crse = new StateDataPhysBCFunct(statedata_crse,scomp,*geom_crse);
-
-        StateData& statedata_fine = fine_level.state[index];
-        statedata_fine.getData(tsmf_fine,tstime_fine,time);
-        StateDataPhysBCFunct* tphysbcf_fine = new StateDataPhysBCFunct(statedata_fine,scomp,*geom_fine);
-
-        const StateDescriptor& desc = AmrLevel::desc_lst[index];
-
-        FillPatchTwoLevelsPull(m_fabs, time,
-                               tsmf_crse, tstime_crse, tsmf_fine, tstime_fine,
-                               destGraph, csrcGraph, fsrcGraph, f, this,
-                               scomp, dcomp, ncomp, *tgeom_crse, *tgeom_fine,
-                               *tphysbcf_crse, *tphysbcf_fine, crse_level.fineRatio(),
-                               desc.interp(scomp), desc.getBCs(), singleT);
-    }
-
-    void AsyncFillPatchIterator::FillFromTwoLevelsPull (MultiFab& dest, Real time, int index,
-                                                        int scomp, int dcomp, int ncomp,
-                                                        int f, bool singleT)
-    {
-        int ilev_fine = m_amrlevel.level;
-        int ilev_crse = ilev_fine-1;
-
-        BL_ASSERT(ilev_crse >= 0);
-
-        AmrLevel& fine_level = m_amrlevel;
-        AmrLevel& crse_level = m_amrlevel.parent->getLevel(ilev_crse);
-
-        Geometry* tgeom_fine = &fine_level.geom;
-        Geometry* tgeom_crse = &crse_level.geom;
-
-        Vector<MultiFab*> tsmf_crse;
-        Vector<MultiFab*> tsmf_fine;
-        Vector<Real> tstime_crse;
-        Vector<Real> tstime_fine;
-        StateData& statedata_crse = crse_level.state[index];
-        statedata_crse.getData(tsmf_crse,tstime_crse,time);
-        StateDataPhysBCFunct* tphysbcf_crse = new StateDataPhysBCFunct(statedata_crse,scomp,*geom_crse);
-
-        StateData& statedata_fine = fine_level.state[index];
-        statedata_fine.getData(tsmf_fine,tstime_fine,time);
-        StateDataPhysBCFunct* tphysbcf_fine = new StateDataPhysBCFunct(statedata_fine,scomp,*geom_fine);
-
-        const StateDescriptor& desc = AmrLevel::desc_lst[index];
-
-        FillPatchTwoLevelsPull(dest, time,
-                               tsmf_crse, tstime_crse, tsmf_fine, tstime_fine,
-                               destGraph, csrcGraph, fsrcGraph, f, this,
-                               scomp, dcomp, ncomp, *tgeom_crse, *tgeom_fine,
-                               *tphysbcf_crse, *tphysbcf_fine, crse_level.fineRatio(),
-                               desc.interp(scomp), desc.getBCs(), singleT);
-    }
-
-    void AsyncFillPatchIterator::initFillPatch(int boxGrow, Real time, int index, int scomp, int ncomp, int iter)
-    {
-        BL_ASSERT(scomp >= 0);
-        BL_ASSERT(ncomp >= 1);
-        BL_ASSERT(0 <= index && index < AmrLevel::desc_lst.size());
-
-        int myProc = amrex::ParallelDescriptor::MyProc();
-
-        const StateDescriptor& desc = AmrLevel::desc_lst[index];
-
-        m_ncomp = ncomp;
-        m_range = desc.sameInterps(scomp,ncomp);
-
-        m_fabs.define(m_leveldata.boxArray(),m_leveldata.DistributionMap(),
-                      m_ncomp,boxGrow);
-
-        BL_ASSERT(m_leveldata.DistributionMap() == m_fabs.DistributionMap());
-
-        const IndexType& boxType = m_leveldata.boxArray().ixType();
-        const int level = m_amrlevel.level;
-
-        for (int i = 0, DComp = 0; i < m_range.size(); i++)
-        {
-            const int SComp = m_range[i].first;
-            const int NComp = m_range[i].second;
-            int dcomp = DComp;
-
-            if (level == 0)
-            {
-                BL_ASSERT(m_amrlevel.level == 0);
-                StateData& statedata = m_amrlevel.state[index];
-                statedata.getData(smf,stime,time);
-                geom = &m_amrlevel.geom;
-                physbcf = new StateDataPhysBCFunct(statedata,scomp,*geom);
-                stateDataList.push_back(physbcf);
-                BL_ASSERT(scomp+ncomp <= smf[0]->nComp());
-                BL_ASSERT(dcomp+ncomp <= m_fabs.nComp());
-                BL_ASSERT(smf.size() == stime.size());
-                BL_ASSERT(smf.size() != 0);
-
-                if (smf.size() == 1)
-                {
-                    dmf = new MultiFab(smf[0]->boxArray(), smf[0]->DistributionMap(), ncomp, 0);
-                    destGraph = new RegionGraph(m_fabs.IndexArray().size());
-                    fsrcGraph = new RegionGraph(smf[0]->IndexArray().size());
-                    regionList.push_back(destGraph);
-                    regionList.push_back(fsrcGraph);
-                    Perilla::multifabExtractCopyAssoc( destGraph, fsrcGraph, m_fabs, *smf[0], ncomp, m_fabs.nGrow(), 0, geom->periodicity());
-                    m_amrlevel.parent->graphArray[level].push_back(destGraph);
-                    m_amrlevel.parent->graphArray[level].push_back(fsrcGraph);
-                }
-                else if (smf.size() == 2)
-                {
-                    BL_ASSERT(smf[0]->boxArray() == smf[1]->boxArray());
-                    if (m_fabs.boxArray() == smf[0]->boxArray())
-                    {
-                        dmf = &m_fabs;
-                        destGraph = new RegionGraph(m_fabs.IndexArray().size());
-                        regionList.push_back(destGraph);
-                        Perilla::multifabBuildFabCon(destGraph, m_fabs, geom->periodicity());
-                        m_amrlevel.parent->graphArray[level].push_back(destGraph);
-                    }
-                    else
-                    {
-                        dmf = new MultiFab(smf[0]->boxArray(), smf[0]->DistributionMap(), ncomp, 0);
-                        destGraph = new RegionGraph(m_fabs.IndexArray().size());
-                        fsrcGraph = new RegionGraph(dmf->IndexArray().size());
-                        fsrcGraph->buildTileArray(*dmf);
-                        regionList.push_back(destGraph);
-                        regionList.push_back(fsrcGraph);
-                        mfList.push_back(dmf);
-
-                        Perilla::multifabExtractCopyAssoc( destGraph, fsrcGraph, m_fabs, *dmf, ncomp, m_fabs.nGrow(), 0, geom->periodicity());
-                        m_amrlevel.parent->graphArray[level].push_back(destGraph);
-                        m_amrlevel.parent->graphArray[level].push_back(fsrcGraph);
-                    }
-                }
-                else
-                {
-                    amrex::Abort("FillPatchSingleLevel: high-order interpolation in time not implemented yet");
-                }
-                //-------------------------------------------------- FillFromLevel0 initialization completed
-            }
-            else
-            {
-                isProperlyNested = amrex::ProperlyNested(m_amrlevel.crse_ratio,
-                                                         m_amrlevel.parent->blockingFactor(m_amrlevel.level),
-                                                         boxGrow, boxType, desc.interp(SComp));
-                if (level == 1 || isProperlyNested)
-                {
-                    int ilev_fine = m_amrlevel.level;
-                    int ilev_crse = ilev_fine-1;
-                    BL_ASSERT(ilev_crse >= 0);
-                    AmrLevel& fine_level = m_amrlevel;
-                    AmrLevel& crse_level = m_amrlevel.parent->getLevel(ilev_crse);
-                    geom_fine = &fine_level.geom;
-                    geom_crse = &crse_level.geom;
-                    StateData& statedata_crse = crse_level.state[index];
-                    statedata_crse.getData(smf_crse,stime_crse,time);
-                    physbcf_crse = new StateDataPhysBCFunct(statedata_crse,scomp,*geom_crse);
-                    StateData& statedata_fine = fine_level.state[index];
-                    statedata_fine.getData(smf_fine,stime_fine,time);
-                    physbcf_fine = new StateDataPhysBCFunct(statedata_fine,scomp,*geom_fine);
-
-                    stateDataList.push_back(physbcf_crse);
-                    stateDataList.push_back(physbcf_fine);
-
-                    const StateDescriptor& desc = AmrLevel::desc_lst[index];
-                    int ngrow = m_fabs.nGrow();
-                    if (ngrow > 0 || m_fabs.getBDKey() != smf_fine[0]->getBDKey())
-                    {
-                        InterpolaterBoxCoarsener coarsener = desc.interp(scomp)->BoxCoarsener(crse_level.fineRatio());
-                        Box fdomain = geom_fine->Domain();
-                        fdomain.convert(m_fabs.boxArray().ixType());
-                        Box fdomain_g(fdomain);
-                        for (int i = 0; i < BL_SPACEDIM; ++i) {
-                            if (geom_fine->isPeriodic(i)) {
-                                fdomain_g.grow(i,ngrow);
-                            }
-                        }
-                        // dummytostopcraycompilererror
-                        std::cout << "";
-
-                        Box c_dom = amrex::coarsen(geom_fine->Domain(), m_amrlevel.crse_ratio);
-
-                        m_fpc = &FabArrayBase::TheFPinfo(*smf_fine[0], m_fabs, fdomain_g, IntVect(ngrow), coarsener, c_dom, NULL);
-
-                        if (!m_fpc->ba_crse_patch.empty())
-                        {
-                            m_mf_crse_patch = new MultiFab(m_fpc->ba_crse_patch, m_fpc->dm_crse_patch, ncomp, 0);
-                            mfList.push_back(m_mf_crse_patch);
-                            BL_ASSERT(scomp+ncomp <= smf_crse[0]->nComp());
-                            BL_ASSERT(dcomp+ncomp <= m_mf_crse_patch->nComp());
-                            BL_ASSERT(smf_crse.size() == stime_crse.size());
-                            BL_ASSERT(smf_crse.size() != 0);
-
-                            //if (smf_crse.size() == 1)
-                            if (iter == 1)
-                            {
-                                m_rg_crse_patch = new RegionGraph(m_mf_crse_patch->IndexArray().size());
-
-                                m_rg_crse_patch->isDepGraph = true;
-
-                                csrcGraph = new RegionGraph(smf_crse[0]->IndexArray().size());
-
-                                regionList.push_back(m_rg_crse_patch);
-                                regionList.push_back(csrcGraph);
-
-                                Perilla::multifabExtractCopyAssoc( m_rg_crse_patch, csrcGraph, *m_mf_crse_patch, *smf_crse[0], ncomp, m_mf_crse_patch->nGrow(), 0, geom_crse->periodicity());
-#if 0
-                                MultiFab temp_4_tile(m_fpc->ba_dst_boxes, m_fpc->dm_crse_patch, ncomp, 0);
-                                m_rg_crse_patch->buildTileArray(temp_4_tile);
-#endif
-                                ///m_rg_crse_patch->buildTileArray(*m_mf_crse_patch);
-                                m_amrlevel.parent->graphArray[level].push_back(m_rg_crse_patch);
-                                m_amrlevel.parent->graphArray[level].push_back(csrcGraph);
-                            }
-                            else if (iter > 1)
-                            {
-                                if (m_mf_crse_patch->boxArray() == smf_crse[0]->boxArray())
-                                {
-                                    //dmf = m_mf_crse_patch;
-                                    m_rg_crse_patch = new RegionGraph(m_mf_crse_patch->IndexArray().size());
-
-                                    //std::cout<< " level " << level << " rg_crs_ptch ID " << m_rg_crse_patch->graphID << std::endl;
-
-                                    Perilla::multifabBuildFabCon(m_rg_crse_patch, *m_mf_crse_patch, geom_crse->periodicity());
-                                    m_amrlevel.parent->graphArray[level].push_back(m_rg_crse_patch);
-                                    regionList.push_back(m_rg_crse_patch);
-                                }
-                                else
-                                {
-                                    dmf = new MultiFab(smf_crse[0]->boxArray(), smf_crse[0]->DistributionMap(), ncomp, 0);
-                                    m_rg_crse_patch = new RegionGraph(m_mf_crse_patch->IndexArray().size());
-                                    m_rg_crse_patch->isDepGraph = true;
-                                    csrcGraph = new RegionGraph(dmf->IndexArray().size());
-                                    csrcGraph->buildTileArray(*dmf);
-
-#if 0
-                                    MultiFab temp_4_tile(m_fpc->ba_dst_boxes, m_fpc->dm_crse_patch, ncomp, 0);
-                                    m_rg_crse_patch->buildTileArray(temp_4_tile);
-#endif
-
-                                    regionList.push_back(m_rg_crse_patch);
-                                    regionList.push_back(csrcGraph);
-                                    mfList.push_back(dmf);
-
-                                    Perilla::multifabExtractCopyAssoc( m_rg_crse_patch, csrcGraph, *m_mf_crse_patch, *dmf, ncomp, m_mf_crse_patch->nGrow(), 0, geom_crse->periodicity());
-                                    m_amrlevel.parent->graphArray[level].push_back(m_rg_crse_patch);
-                                    m_amrlevel.parent->graphArray[level].push_back(csrcGraph);
-                                }
-                            }
-                            else
-                            {
-                                amrex::Abort("FillPatchSingleLevel: high-order interpolation in time not implemented yet");
-                            }
-                        }
-                    }
-
-                    BL_ASSERT(scomp+ncomp <= smf_fine[0]->nComp());
-                    BL_ASSERT(dcomp+ncomp <= m_fabs.nComp());
-                    BL_ASSERT(smf_fine.size() == stime_fine.size());
-                    BL_ASSERT(smf_fine.size() != 0);
-
-                    //if (smf_fine.size() == 1) // probabily it should aways be this because same level
-                    //if (iter == 1)
-                    if(true) // it will always be the case because same level comm and time will be available
-                    {
-                        destGraph = new RegionGraph(m_fabs.IndexArray().size());
-                        fsrcGraph = new RegionGraph(smf_fine[0]->IndexArray().size());
-
-                        regionList.push_back(destGraph);
-                        regionList.push_back(fsrcGraph);
-
-                        if(m_rg_crse_patch != 0)
-                        {
-                            destGraph->srcLinkGraph = m_rg_crse_patch;
-                            //for(int lfi=0; lfi < destGraph->numTasks; lfi++ )
-
-                            //std::cout << " m_mf_crse_patch->IndexArray().size() " << m_mf_crse_patch->IndexArray().size() << " size " << m_mf_crse_patch->size() << " myP " << myProc<< std::endl;
-
-                            {
-                                for (MFIter mfi(*(m_mf_crse_patch),false); mfi.isValid(); ++mfi)
-                                {
-                                    int li = mfi.LocalIndex();
-                                    int gi = m_fpc->dst_idxs[li];
-                                    //if(gi == m_mf_crse_patch->IndexArray()[li])
-                                    {
-                                        int lfi = m_fabs.localindex(gi);
-                                        destGraph->task[lfi]->depTasksCompleted = false;
-                                        destGraph->task[lfi]->depTaskIDs.push_back(li);
-                                    }
-                                }
-                            }
-                        }
-                        //if(level == 2)
-                        //std::cout<< "Sending In " << std::endl;
-                        Perilla::multifabExtractCopyAssoc( destGraph, fsrcGraph, m_fabs, *smf_fine[0], ncomp, m_fabs.nGrow(), 0, geom_fine->periodicity());
-
-                        m_amrlevel.parent->graphArray[level].push_back(destGraph);
-                        m_amrlevel.parent->graphArray[level].push_back(fsrcGraph);
-                    }
-                    else if (smf_fine.size() == 2)
-                    //else if (iter > 1)
-                    {
-                        //BL_ASSERT(smf_fine[0]->boxArray() == smf_fine[1]->boxArray());
-                        //PArray<MultiFab> raii(PArrayManage);
-                        //MultiFab * dmf;
-
-                        if (m_fabs.boxArray() == smf_fine[0]->boxArray())
-                        {
-                            //dmf = &m_fabs;
-                            destGraph = new RegionGraph(m_fabs.IndexArray().size());
-
-                            Perilla::multifabBuildFabCon(destGraph, m_fabs, geom_fine->periodicity());
-                            m_amrlevel.parent->graphArray[level].push_back(destGraph);
-                            regionList.push_back(destGraph);
-                        }
-                        else
-                        {
-                            //dmf = raii.push_back(new MultiFab(smf_fine[0]->boxArray(), m_amrlevel.dmap, ncomp, 0));
-                            dmff = new MultiFab(smf_fine[0]->boxArray(), smf_fine[0]->DistributionMap(), ncomp, 0);
-                            //dmff->initVal(); // for Perilla NUMA
-                            destGraph = new RegionGraph(m_fabs.IndexArray().size());
-                            fsrcGraph = new RegionGraph(dmff->IndexArray().size());
-                            fsrcGraph->buildTileArray(*dmff);
-                            regionList.push_back(destGraph);
-                            regionList.push_back(fsrcGraph);
-                            mfList.push_back(dmff);
-
-                            Perilla::multifabExtractCopyAssoc( destGraph, fsrcGraph, m_fabs, *dmff, ncomp, m_fabs.nGrow(), 0, geom_fine->periodicity());
-                            m_amrlevel.parent->graphArray[level].push_back(destGraph);
-                            m_amrlevel.parent->graphArray[level].push_back(fsrcGraph);
-                        }
-                    }
-                    else
-                    {
-                        amrex::Abort("FillPatchSingleLevel: high-order interpolation in time not implemented yet");
-                    }
-                    //-------------------- FillFromTwoLevels initialization completed
-
-                } // if(level==1 OR ProperlyNested)
-                else
-                {
-                    amrex::Abort("initFillPatch: level is not properly nested");
-                }
-            }
-            DComp += NComp;
-        }
-
-        destGraph->buildTileArray(m_fabs);
-        destGraph->buildTileArray_gtbx(m_leveldata,boxGrow);
-        //MemOpt
-        //m_fabs.clear();
-    }
-
-    void AsyncFillPatchIterator::SendIntraLevel (RGIter& rgi, int boxGrow, Real time,
-                                                 int index, int scomp, int ncomp,
-                                                 int iteration, int f, bool singleT)
-    {
-        if(rgi.currentItr != rgi.totalItr)
-            return;
-
-        const int level = m_amrlevel.level;
-
-        int ncycle = m_amrlevel.parent->nCycle(level);
-        unsigned char pushLevel = 0x02;
-        PushOnly(boxGrow, time, index, scomp, ncomp, f, pushLevel, singleT);
-    }
-
-    void AsyncFillPatchIterator::SendInterLevel (RGIter* rgi, int boxGrow, Real time,
-                                                 int index, int scomp, int ncomp,
-                                                 int iteration, int f, bool singleT)
-    {
-        if(rgi->currentItr != rgi->totalItr)
-            return;
-
-        if(m_amrlevel.level-1 < m_amrlevel.parent->finestLevel())
-        {
-            unsigned char tuc = 0x01;
-            PushOnly(boxGrow, time+((iteration-1)*m_amrlevel.parent->dtLevel(m_amrlevel.level)), index, scomp, ncomp, f, tuc, singleT);
-        }
-    }
-
-    void AsyncFillPatchIterator::SendInterLevel (RGIter& rgi, int boxGrow, Real time,
-                                                 int index, int scomp, int ncomp,
-                                                 int iteration, int f, bool singleT)
-    {
-        SendInterLevel(&rgi, boxGrow, time, index, scomp, ncomp, iteration, f, singleT);
-    }
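SendIntraLevel and SendInterLevel above are guarded so the push happens only on the last sub-iteration of the region-graph iterator. A minimal sketch of that guard with a stand-in type (the real RGIter is a Perilla class with more state):

    #include <cstdio>

    struct RGIterLike {        // stand-in for the Perilla RGIter
        int currentItr;
        int totalItr;
    };

    void sendIntraLevel(const RGIterLike& rgi)
    {
        if (rgi.currentItr != rgi.totalItr) return;   // only send on the last sub-iteration
        std::printf("pushing same-level data\n");
    }

    int main()
    {
        for (int it = 1; it <= 3; ++it) {
            sendIntraLevel(RGIterLike{it, 3});        // prints once, at it == 3
        }
    }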
-    void AsyncFillPatchIterator::PushOnly (int boxGrow, Real time, int index, int scomp,
-                                           int ncomp, int f, unsigned char pushLevel, bool singleT)
-    {
-        BL_PROFILE("FillPatchIterator::InitializePush");
-        BL_ASSERT(scomp >= 0);
-        BL_ASSERT(ncomp >= 1);
-        BL_ASSERT(0 <= index && index < AmrLevel::desc_lst.size());
-
-        //const IndexType& boxType = m_leveldata.boxArray().ixType();
-        const int level = m_amrlevel.level;
-
-        int myProc = amrex::ParallelDescriptor::MyProc();
-        for (int i = 0, DComp = 0; i < m_range.size(); i++)
-        {
-            if(i>0)
-                amrex::Abort("**** Error in FillPatchIterator::Initialize: non contigeous components not implemented");
-
-            const int SComp = m_range[i].first;
-            const int NComp = m_range[i].second;
-
-            if (level == 0)
-            {
-                Vector<MultiFab*> tsmf;
-                Vector<Real> tstime;
-                StateData& statedata = m_amrlevel.state[index];
-                statedata.getData(tsmf,tstime,time);
-                FillPatchSingleLevelPush (*(m_amrlevel.parent), m_fabs, time, tsmf, tstime, destGraph, fsrcGraph, f, dmf, SComp, DComp, NComp, *geom, *physbcf, singleT);
-            }else{
-                if (level == 1 || isProperlyNested)
-                {
-                    FillFromTwoLevelsPush(time, index, SComp, DComp, NComp, f, pushLevel, singleT);
-                }else {
-                    amrex::Abort("**** Error in FillPatchIterator::Initialize: !ProperlyNested not implemented");
-                }
-            }
-            DComp += NComp;
-        }
-    }
-
-    void AsyncFillPatchIterator::PullOnly (int boxGrow, Real time, int index, int scomp,
-                                           int ncomp, int f, bool singleT)
-    {
-        BL_PROFILE("FillPatchIterator::InitializePull");
-        BL_ASSERT(scomp >= 0);
-        BL_ASSERT(ncomp >= 1);
-        BL_ASSERT(0 <= index && index < AmrLevel::desc_lst.size());
-
-        //const IndexType& boxType = m_leveldata.boxArray().ixType();
-        const int level = m_amrlevel.level;
-
-        for (int i = 0, DComp = 0; i < m_range.size(); i++)
-        {
-            if(i>0)
-                amrex::Abort("**** Error in FillPatchIterator::Initialize: non contigeous components not implemented");
-
-            const int SComp = m_range[i].first;
-            const int NComp = m_range[i].second;
-
-            if (level == 0)
-            {
-                FillPatchSingleLevelPull (m_fabs, time, smf, stime, destGraph, fsrcGraph, f, SComp, DComp, NComp, *geom, *physbcf, singleT);
-            }
-            else
-            {
-                if (level == 1 || isProperlyNested)
-                {
-                    FillFromTwoLevelsPull(time, index, SComp, DComp, NComp, f, singleT);
-                } else {
-                    amrex::Abort("**** Error in FillPatchIterator::Initialize: !ProperlyNested not implemented");
-                }
-            }
-            //if(WorkerThread::isTeamMasterThread(tid))
-            {
-                const MultiFab& mf_fillpatched = m_fabs;
-                if(singleT)
-                {
-                    for(int t=0; t<destGraph->fabTiles_gtbx[f]->numTiles; t++)
-                    {
-                        const Box& bx = *(destGraph->fabTiles_gtbx[f]->tileBx[t]);
-                        MultiFab::Copy(m_leveldata, mf_fillpatched, f, 0, DComp, ncomp, bx);
-                    }
-                }
-                else
-                {
-                    int nt = perilla::wtid();
-                    int totalCompThreads= perilla::NUM_THREADS_PER_TEAM-perilla::NUM_COMM_THREADS;
-                    for(int t=nt; t<destGraph->fabTiles_gtbx[f]->numTiles; t+= totalCompThreads)
-                    {
-                        const Box& bx = *(destGraph->fabTiles_gtbx[f]->tileBx[t]);
-                        MultiFab::Copy(m_leveldata, mf_fillpatched, f, 0, DComp, ncomp, bx);
-                    }
-                }
-            }
-            DComp += NComp;
-        }
-    }
-
-    void
-    AsyncFillPatchIterator::PullOnly (MultiFab& dest, int boxGrow, Real time, int index,
-                                      int scomp, int ncomp, int f, bool singleT)
-    {
-        BL_PROFILE("FillPatchIterator::InitializePull");
-        BL_ASSERT(scomp >= 0);
-        BL_ASSERT(ncomp >= 1);
-        BL_ASSERT(0 <= index && index < AmrLevel::desc_lst.size());
-
-        int myProc = amrex::ParallelDescriptor::MyProc();
-
-        //const IndexType& boxType = m_leveldata.boxArray().ixType();
-        const int level = m_amrlevel.level;
-
-        for (int i = 0, DComp = 0; i < m_range.size(); i++)
-        {
-            if(i>0)
-                amrex::Abort("**** Error in FillPatchIterator::Initialize: non contigeous components not implemented");
-
-            const int SComp = m_range[i].first;
-            const int NComp = m_range[i].second;
-
-            if (level == 0)
-            {
-                //double start_time_wtime = omp_get_wtime();
-                try{
-                    //MemOpt
-                    FillPatchSingleLevelPull (dest, time, smf, stime, destGraph, fsrcGraph, f, SComp, DComp, NComp, *geom, *physbcf, singleT);
-                    //amrex::FillPatchSingleLevelPull (m_fabs, time, smf, stime, destGraph, fsrcGraph, f, tid, SComp, DComp, NComp, *geom, *physbcf, singleT);
-                }
-                catch(std::exception& e){
-                    std::cout<< "AFPI_Receive_FPSLPull: Proc " << myProc << std::endl;
-                }
-            }
-            else
-            {
-                if (level == 1 || isProperlyNested)
-                {
-                    FillFromTwoLevelsPull(dest, time, index, SComp, DComp, NComp, f, singleT);
-                } else {
-                    amrex::Abort("**** Error in FillPatchIterator::Initialize: !ProperlyNested not implemented");
-                }
-            }
-            DComp += NComp;
-        }
-    }
-
-    void AsyncFillPatchIterator::FillPatchSingleLevelPush (Amr& amr, MultiFab& mf, Real time,
-                                                           Vector<MultiFab*>& smf, const Vector<Real>& stime,
-                                                           RegionGraph* destGraph, RegionGraph* srcGraph, int f,
-                                                           MultiFab *dmf,
-                                                           int scomp, int dcomp, int ncomp,
-                                                           const Geometry& geom, StateDataPhysBCFunct& physbcf, bool singleT)
-    {
-        BL_PROFILE("FillPatchSingleLevel");
-        BL_ASSERT(scomp+ncomp <= smf[0]->nComp());
-        BL_ASSERT(dcomp+ncomp <= mf.nComp());
-        BL_ASSERT(smf.size() == stime.size());
-        BL_ASSERT(smf.size() != 0);
-
-        int tg = perilla::wid();
-        int nt = perilla::wtid();
-
-        if (smf.size() == 1)
-        {
-            //mf.copy(smf[0], scomp, dcomp, ncomp, 0, mf.nGrow(), geom.periodicity());
-            Perilla::multifabCopyPush(destGraph, srcGraph, &mf, smf[0], f, dcomp, scomp, ncomp, mf.nGrow(), 0, singleT);
-        }
-        else if (smf.size() == 2)
-        {
-            BL_ASSERT(smf[0]->boxArray() == smf[1]->boxArray());
-            //PArray<MultiFab> raii(PArrayManage);
-            //MultiFab * dmf;
-            int destcomp;
-            bool sameba;
-            //if (false && mf.boxArray() == smf[0]->boxArray())
-            if (mf.boxArray() == smf[0]->boxArray())
-            {
-                std::cout << "FillPatchUtil SLPush Nt Handled" << std::endl;
-
-                //dmf = &mf;
-                destcomp = dcomp;
-                sameba = true;
-
-                int fis = smf[0]->IndexArray()[f];
-                int fid = mf.IndexArray()[f];
-
-                const Box& bx = mf[fid].box();
-                mf[fid].linInterp(smf[0]->get(fis), scomp, smf[1]->get(fis), scomp,
-                                  stime[0], stime[1], time, bx, destcomp, ncomp);
-                Perilla::fillBoundaryPush(destGraph, &mf, f);
-            }
-            else
-            {
-                destcomp = 0;
-                sameba = false;
-
-                int fis = smf[0]->IndexArray()[f];
-                int fid = dmf->IndexArray()[f];
-
-                for(int t=0; t<srcGraph->fabTiles[f]->numTiles; t++)
-                    if( singleT || t % (perilla::NUM_THREADS_PER_TEAM-perilla::NUM_COMM_THREADS) == nt)
-                    {
-                        const Box& bx = *(srcGraph->fabTiles[f]->tileBx[t]);
-                        if(bx.ok())
-                            (*dmf)[fid].linInterp(smf[0]->get(fis), scomp, smf[1]->get(fis), scomp,
-                                                  stime[0], stime[1], time, bx, destcomp, ncomp);
-                    }
-                if(!singleT)
-                    srcGraph->worker[tg]->barr->sync(perilla::NUM_THREADS_PER_TEAM-perilla::NUM_COMM_THREADS); // Barrier to synchronize team threads
-                int src_ngrow = 0;
-                int dst_ngrow = mf.nGrow();
-                Perilla::multifabCopyPush( destGraph, srcGraph, &mf, dmf, f, dcomp, 0, ncomp, mf.nGrow(), 0, singleT);
-            }
-        }
-        else
-        {
-            amrex::Abort("FillPatchSingleLevel: high-order interpolation in time not implemented yet");
-        }
-    }
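The linInterp calls above blend the two stored state times: for t0 <= t <= t1, u(t) = u(t0) + (t - t0)/(t1 - t0) * (u(t1) - u(t0)), applied cell by cell over each tile box. The same formula on a plain array (a sketch, not the FArrayBox API):

    #include <cstdio>

    int main()
    {
        const double t0 = 0.0, t1 = 1.0, t = 0.25;   // two state times and the target time
        const double u0[3] = {1.0, 2.0, 3.0};        // snapshot at t0
        const double u1[3] = {2.0, 4.0, 6.0};        // snapshot at t1

        double u[3];
        const double w = (t - t0) / (t1 - t0);       // interpolation weight
        for (int i = 0; i < 3; ++i) {
            u[i] = u0[i] + w * (u1[i] - u0[i]);
        }
        std::printf("u = {%g, %g, %g}\n", u[0], u[1], u[2]);   // {1.25, 2.5, 3.75}
    }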
-
-    void AsyncFillPatchIterator::FillPatchSingleLevelPull (MultiFab& mf, Real time,
-                                                           Vector<MultiFab*>& smf, const Vector<Real>& stime,
-                                                           RegionGraph* destGraph, RegionGraph* srcGraph, int f,
-                                                           int scomp, int dcomp, int ncomp,
-                                                           const Geometry& geom, StateDataPhysBCFunct& physbcf, bool singleT)
-    {
-        BL_PROFILE("FillPatchSingleLevel");
-
-        BL_ASSERT(scomp+ncomp <= smf[0]->nComp());
-        BL_ASSERT(dcomp+ncomp <= mf.nComp());
-        BL_ASSERT(smf.size() == stime.size());
-        BL_ASSERT(smf.size() != 0);
-
-        int tg = perilla::wid();
-
-        if (smf.size() == 1)
-        {
-            //mf.copy(smf[0], scomp, dcomp, ncomp, 0, mf.nGrow(), geom.periodicity());
-            Perilla::multifabCopyPull( destGraph, srcGraph, &mf, smf[0], f, dcomp, scomp, ncomp, mf.nGrow(), 0, singleT);
-        }
-        else if (smf.size() == 2)
-        {
-            BL_ASSERT(smf[0]->boxArray() == smf[1]->boxArray());
-            Vector<MultiFab*> raii;
-            MultiFab * dmf;
-            int destcomp;
-            bool sameba;
-            //if (false && mf.boxArray() == smf[0]->boxArray()) {
-            if (mf.boxArray() == smf[0]->boxArray()) {
-                //dmf = &mf;
-                destcomp = dcomp;
-                sameba = true;
-            } else {
-                //dmf = srcGraph->assocMF;
-                destcomp = 0;
-                sameba = false;
-            }
-            if (sameba)
-            {
-                // Note that when sameba is true mf's BoxArray is nonoverlapping.
-                // So FillBoundary is safe.
-                //mf.FillBoundary(dcomp,ncomp,geom.periodicity());
-
-                Perilla::fillBoundaryPull(destGraph, &mf, f, singleT);
-
-                //std::cout << "After sameba fBPull" << std::endl;
-            }
-            else
-            {
-                int src_ngrow = 0;
-                int dst_ngrow = mf.nGrow();
-                MultiFab* dummyMF;
-
-                //mf.copy(*dmf, 0, dcomp, ncomp, src_ngrow, dst_ngrow, geom.periodicity());
-
-                Perilla::multifabCopyPull( destGraph, srcGraph, &mf, dummyMF, f, dcomp, 0, ncomp, mf.nGrow(), 0, singleT);
-            }
-        }
-        else {
-            amrex::Abort("FillPatchSingleLevel: high-order interpolation in time not implemented yet");
-        }
-
-        if(!singleT)
-            destGraph->worker[tg]->barr->sync(perilla::NUM_THREADS_PER_TEAM-perilla::NUM_COMM_THREADS);
-    }
-
-    void AsyncFillPatchIterator::FillPatchTwoLevelsPush (Amr& amr, MultiFab& mf, Real time,
-                                                         Vector<MultiFab*>& cmf, Vector<Real>& ct,
-                                                         Vector<MultiFab*>& fmf, Vector<Real>& ft,
-                                                         RegionGraph* destGraph, RegionGraph* csrcGraph, RegionGraph* fsrcGraph, int f,
-                                                         AsyncFillPatchIterator* fpIter,
-                                                         MultiFab *dmf, MultiFab *dmff,
-                                                         int scomp, int dcomp, int ncomp,
-                                                         const Geometry& cgeom, const Geometry& fgeom,
-                                                         StateDataPhysBCFunct& cbc, StateDataPhysBCFunct& fbc,
-                                                         const IntVect& ratio,
-                                                         Interpolater* mapper, const Vector<BCRec>& bcs, unsigned char pushLevel, bool singleT)
-    {
-        BL_PROFILE("FillPatchTwoLevels");
-
-        int ngrow = mf.nGrow();
-
-        if(f>=0){ //fill only this fab
-            if(pushLevel & 0x01 )
-            {
-                if (ngrow > 0 || mf.getBDKey() != fmf[0]->getBDKey())
-                {
-                    if (!fpIter->m_fpc->ba_crse_patch.empty())
-                    {
-                        FillPatchSingleLevelPush(amr, *(fpIter->m_mf_crse_patch), time, cmf, ct, fpIter->m_rg_crse_patch, csrcGraph, f, dmf, scomp, 0, ncomp, cgeom, cbc, singleT);
-                    }
-                }
-            }
-            if((pushLevel & 0x02) && (pushLevel != 0x03))
-            {
-                FillPatchSingleLevelPush(amr, mf, time, fmf, ft, destGraph, fsrcGraph, f, dmff, scomp, dcomp, ncomp, fgeom, fbc, singleT);
-            }
-        }else{ //fill the whole multifab
-            if(pushLevel & 0x01 && pushLevel & 0x02)
-            {
-                int tg = perilla::wid();
-                for(int fi=0; fi < fmf[0]->IndexArray().size(); fi++)
-                {
-                    if(WorkerThread::isMyRegion(tg,fi))
-                    {
-                        FillPatchSingleLevelPush(amr, mf, time, fmf, ft, destGraph, fsrcGraph, fi, dmff, scomp, dcomp, ncomp, fgeom, fbc, singleT);
-                    }
-                }
-            }
-            if(pushLevel & 0x04)
-            {
-                int tg = perilla::wid();
-                for(int fi=0; fi < fmf[0]->IndexArray().size(); fi++)
-                {
-                    if(WorkerThread::isMyRegion(tg,fi))
-                    {
-                        FillPatchSingleLevelPush(amr, mf, time, fmf, ft, destGraph, fsrcGraph, fi, dmff, scomp, dcomp, ncomp, fgeom, fbc, singleT);
-                    }
-                }
-            }
-        }
-
-#if 0
-        BL_PROFILE("FillPatchTwoLevels");
-
-        int ngrow = mf.nGrow();
-
-        if(pushLevel & 0x01 )
-        {
-            if (ngrow > 0 || mf.getBDKey() != fmf[0]->getBDKey())
-            {
-                if ( !
-                     fpIter->m_fpc->ba_crse_patch.empty())
-                {
-                    FillPatchSingleLevelPush(amr, *(fpIter->m_mf_crse_patch), time, cmf, ct, fpIter->m_rg_crse_patch, csrcGraph, f, tid, dmf, scomp, 0, ncomp, cgeom, cbc, singleT);
-
-                }
-            }
-
-            if(tf == 0 && (pushLevel & 0x02) )
-            {
-                int tg = WorkerThread::groupID(tid);
-                for(int fi=0; fi < fmf[0]->IndexArray().size(); fi++)
-                {
-                    if(WorkerThread::isMyRegion(tg,fi))
-                    {
-                        FillPatchSingleLevelPush(amr, mf, time, fmf, ft, destGraph, fsrcGraph, fi, tid, dmff, scomp, dcomp, ncomp, fgeom, fbc, singleT);
-                    }
-                }
-            }
-        }
-        if(tf == 0 && (pushLevel & 0x04) )
-        {
-            int tg = WorkerThread::groupID(tid);
-            for(int fi=0; fi < fmf[0]->IndexArray().size(); fi++)
-            {
-                if(WorkerThread::isMyRegion(tg,fi))
-                {
-                    FillPatchSingleLevelPush(amr, mf, time, fmf, ft, destGraph, fsrcGraph, fi, tid, dmff, scomp, dcomp, ncomp, fgeom, fbc, singleT);
-                }
-            }
-        }
-
-        if((pushLevel & 0x02) && (pushLevel != 0x03))
-        {
-            FillPatchSingleLevelPush(amr, mf, time, fmf, ft, destGraph, fsrcGraph, f, tid, dmff, scomp, dcomp, ncomp, fgeom, fbc, singleT);
-        }
-#endif
-    }
-
-    void AsyncFillPatchIterator::FillPatchTwoLevelsPull (MultiFab& mf, Real time,
-                                                         Vector<MultiFab*>& cmf, Vector<Real>& ct,
-                                                         Vector<MultiFab*>& fmf, Vector<Real>& ft,
-                                                         RegionGraph* destGraph, RegionGraph* csrcGraph, RegionGraph* fsrcGraph, int f,
-                                                         AsyncFillPatchIterator* fpIter,
-                                                         int scomp, int dcomp, int ncomp,
-                                                         const Geometry& cgeom, const Geometry& fgeom,
-                                                         StateDataPhysBCFunct& cbc, StateDataPhysBCFunct& fbc,
-                                                         const IntVect& ratio,
-                                                         Interpolater* mapper, const Vector<BCRec>& bcs, bool singleT)
-    {
-        BL_PROFILE("FillPatchTwoLevels");
-        int ngrow = mf.nGrow();
-        int tg = WorkerThread::perilla_wid();
-        int nt = WorkerThread::perilla_wtid();
-
-        if (ngrow > 0 || mf.getBDKey() != fmf[0]->getBDKey())
-        {
-            if ( ! fpIter->m_fpc->ba_crse_patch.empty())
-            {
-                int idummy1=0, idummy2=0;
-                bool cc = fpIter->m_fpc->ba_crse_patch.ixType().cellCentered();
-                {
-                    int gi = mf.IndexArray()[f];
-                    for(int i=0; i<destGraph->task[f]->depTaskIDs.size(); i++)
-                    {
-                        int li = destGraph->task[f]->depTaskIDs[i];
-                        int mfi = fpIter->m_mf_crse_patch[0].IndexArray()[li];
-                        FillPatchSingleLevelPull(*(fpIter->m_mf_crse_patch), time, cmf, ct, fpIter->m_rg_crse_patch, csrcGraph, li, scomp, 0, ncomp, cgeom, cbc, singleT);
-                    }
-                    if(!singleT)
-                        destGraph->worker[tg]->barr->sync(perilla::NUM_THREADS_PER_TEAM-1);
-
-                    int nt = WorkerThread::perilla_wtid();
-                    Box fdomain = fgeom.Domain();
-                    for(int i=0; i<destGraph->task[f]->depTaskIDs.size(); i++)
-                    {
-                        int li = destGraph->task[f]->depTaskIDs[i];
-                        int mfi = fpIter->m_mf_crse_patch[0].IndexArray()[li];
-                        if(singleT)
-                        {
-                            const Box& dbx = fpIter->m_fpc->dst_boxes[li];
-                            //Array<BCRec> bcr(ncomp);
-                            Vector<BCRec> bcr(ncomp);
-                            amrex::setBC(dbx,fdomain,scomp,0,ncomp,bcs,bcr);
-
-                            mapper->interp(fpIter->m_mf_crse_patch[0][mfi], 0, mf[gi], dcomp, ncomp, dbx,
-                                           ratio, cgeom, fgeom, bcr, idummy1, idummy2, RunOn::Cpu);
-                        }
-                        else
-                        {
-                            if(!cc)
-                            {
-                                if(WorkerThread::perilla_isMasterWorkerThread())
-                                {
-                                    const Box& dbx = fpIter->m_fpc->dst_boxes[li];
-                                    //Box fdomain = fgeom.Domain();
-
-                                    Vector<BCRec> bcr(ncomp);
-                                    amrex::setBC(dbx,fdomain,scomp,0,ncomp,bcs,bcr);
-
-                                    mapper->interp(fpIter->m_mf_crse_patch[0][mfi], 0, mf[gi], dcomp, ncomp, dbx,
-                                                   ratio, cgeom, fgeom, bcr, idummy1, idummy2, RunOn::Cpu);
-                                }
-                            }
-                            else
-                            {
-                                for(int j=0; j < fpIter->m_rg_crse_patch->fabTiles[li]->numTiles; j++)
-                                    if(j % (perilla::NUM_THREADS_PER_TEAM-perilla::NUM_COMM_THREADS) == nt)
-                                    {
-                                        const Box& dbx = *(fpIter->m_rg_crse_patch->fabTiles[li]->tileBx[j]);
-                                        if(dbx.ok())
-                                        {
-                                            Vector<BCRec> bcr(ncomp);
-                                            amrex::setBC(dbx,fdomain,scomp,0,ncomp,bcs,bcr);
-                                            mapper->interp(fpIter->m_mf_crse_patch[0][mfi], 0, mf[gi], dcomp, ncomp, dbx,
-                                                           ratio, cgeom, fgeom, bcr, idummy1, idummy2, RunOn::Cpu);
-                                        }
-                                    }
-                            }
-                        }
-                        //destGraph->worker[tg]->barr->sync(perilla::NUM_THREADS_PER_TEAM-1);
-                    }
-                    if(!singleT)
-                        destGraph->worker[tg]->barr->sync(perilla::NUM_THREADS_PER_TEAM-1);
-                }
-            }
-        }
-
-        FillPatchSingleLevelPull(mf, time, fmf, ft, destGraph, fsrcGraph, f, scomp, dcomp, ncomp, fgeom, fbc, singleT);
-    }
-
-#if 0
-    void AsyncFillPatchIterator::FillPatchTwoLevelsPull (MultiFab& mf, Real time,
-                                                         Vector<MultiFab*>& cmf, const Vector<Real>& ct,
-                                                         Vector<MultiFab*>& fmf, const Vector<Real>& ft,
-                                                         RegionGraph* destGraph, RegionGraph* csrcGraph, RegionGraph* fsrcGraph, int f, int tid,
-                                                         AsyncFillPatchIterator* fpIter,
-                                                         int scomp, int dcomp, int ncomp,
-                                                         const Geometry& cgeom, const Geometry& fgeom,
-                                                         PhysBCFunctBase& cbc, PhysBCFunctBase& fbc,
-                                                         const IntVect& ratio,
-                                                         Interpolater* mapper, const Vector<BCRec>& bcs, bool singleT)
-    {
-        BL_PROFILE("FillPatchTwoLevels");
-
-        int ngrow = mf.nGrow();
-
-        int tg = perilla::wid();//WorkerThread::groupID(tid);
-        int nt = perilla::wtid();//WorkerThread::numaTID(tid);
-
-        int myProc = ParallelDescriptor::MyProc();
-        //std::ofstream fout;
-        //fout.open(std::to_string(myProc)+ "_" + std::to_string(tid) + ".txt", std::fstream::app);
-
-        if (ngrow > 0 || mf.getBDKey() != fmf[0]->getBDKey())
-        {
-            //fout << "FPTL fpIter->m_fpc->ba_crse_patch.empty() " << fpIter->m_fpc->ba_crse_patch.empty() << std::endl;
-
-            if ( ! fpIter->m_fpc->ba_crse_patch.empty())
-            {
-                int idummy1=0, idummy2=0;
-                bool cc = fpIter->m_fpc->ba_crse_patch.ixType().cellCentered();
-
-                //std::cout << "Check CC : " << cc << std::endl;
-                //#ifdef _OPENMP
-                //#pragma omp parallel if (cc)
-                //#endif
-
-                //for (MFIter mfi(*(fpIter->m_mf_crse_patch),false,false); mfi.isValid(); ++mfi)
-                {
-                    //int li = mfi.LocalIndex();
-                    //int gi = fpIter->m_fpc->dst_idxs[li];
-                    //if(gi == mf.IndexArray()[f])
-                    int gi = mf.IndexArray()[f];
-                    //if(gi == f)
-
-                    //fout << "FPTL gi " << gi << " f " << f << " destGraph->task[f]->depTaskIDs.size() " << destGraph->task[f]->depTaskIDs.size() << std::endl;
-
-                    //double start_time_wtime = omp_get_wtime();
-
-                    for(int i=0; i<destGraph->task[f]->depTaskIDs.size(); i++)
-                    {
-                        int li = destGraph->task[f]->depTaskIDs[i];
-                        int mfi = fpIter->m_mf_crse_patch[0].IndexArray()[li];
-
-                        //fout << "Calling FPSL for dependent gi "<< gi << " li " << li << std::endl;
-                        FillPatchSingleLevelPull(*(fpIter->m_mf_crse_patch), time, cmf, ct, fpIter->m_rg_crse_patch, csrcGraph, li, tid, scomp, 0, ncomp, cgeom, cbc, singleT);
-                    }
-                    //if(!singleT)
-                    //destGraph->worker[tg]->barr->sync(perilla::NUM_THREADS_PER_TEAM-perilla::NUM_COMM_THREADS);
-
-                    //double end_time_wtime = omp_get_wtime();
-                    /*if(singleT)
-                        Perilla::getPPPTimeSplit[8] += end_time_wtime - start_time_wtime;
-                    else
-                        if(WorkerThread::isTeamMasterThread(tid))
-                            Perilla::getPPPTimeSplit[8] += end_time_wtime - start_time_wtime;
-                    */
-                    //if(myProc == 0 && nt == 4)
-                    //std::cout << "CC " << cc << " DepTasks " << destGraph->task[f]->depTaskIDs.size() << std::endl;
-
-                    //start_time_wtime = omp_get_wtime();
-                    int nt = perilla::wtid();//WorkerThread::numaTID(tid);
-                    Box fdomain = fgeom.Domain();
-                    for(int i=0; i<destGraph->task[f]->depTaskIDs.size(); i++)
-                    {
-                        int li = destGraph->task[f]->depTaskIDs[i];
-                        int mfi = fpIter->m_mf_crse_patch[0].IndexArray()[li];
-                        /*
-                        const Box& dbx1 = fpIter->m_fpc->dst_boxes[li];
-
-                        std::ofstream fout;
-                        fout.open(std::to_string(myProc)+ "_" + std::to_string(tid) + ".txt", std::fstream::app);
-                        fout << "i "<< i << " depsiz " << destGraph->task[f]->depTaskIDs.size() <<" li "<< li << " f "<< f << " mfi "<< mfi << " gi " << gi << std::endl;
-                        fout <<" numFabs " << fpIter->m_rg_crse_patch->fabTiles.size() << " numTls " << fpIter->m_rg_crse_patch->fabTiles[li]->numTiles << " ndbs " << fpIter->m_fpc->dst_boxes.size() << std::endl;
-                        //fout <<"dbx " << dbx << std::endl;
-                        fout <<"dst_bxs " << dbx1 << std::endl;
-                        fout <<"fine bx " << mf[gi].box() << std::endl;
-                        fout <<"crse bx " << fpIter->m_mf_crse_patch[0][mfi].box() << std::endl;
-                        fout.close();
-                        */
-
-                        if(singleT)
-                        {
-                            const Box& dbx = fpIter->m_fpc->dst_boxes[li];
-                            //Box fdomain = fgeom.Domain();
-
-                            Vector<BCRec> bcr(ncomp);
-                            amrex::setBC(dbx,fdomain,scomp,0,ncomp,bcs,bcr);
-
-                            mapper->interp(fpIter->m_mf_crse_patch[0][mfi], 0, mf[gi], dcomp, ncomp, dbx,
-                                           ratio, cgeom, fgeom, bcr, idummy1, idummy2, RunOn::Cpu);
-                        }
-                        else
-                        {
-                            if(!cc)
-                            {
-                                if(WorkerThread::isTeamMasterThread(tid))
-                                {
-                                    const Box& dbx = fpIter->m_fpc->dst_boxes[li];
-                                    //Box fdomain = fgeom.Domain();
-
-                                    Array<BCRec> bcr(ncomp);
-                                    amrex::setBC(dbx,fdomain,scomp,0,ncomp,bcs,bcr);
-
-                                    mapper->interp(fpIter->m_mf_crse_patch[0][mfi], 0, mf[gi], dcomp, ncomp, dbx,
-                                                   ratio, cgeom, fgeom, bcr, idummy1, idummy2, RunOn::Cpu);
-                                }
-                            }
-                            else
-                            {
-                                //std::cout << "myP " << myProc << " nt "<< nt << " li "<< li << " mfi " << mfi << " ntiles " << fpIter->m_rg_crse_patch->fabTiles.size()<< std::endl;
-                                ///for(int j=0; j < fpIter->m_rg_crse_patch->fabTiles[f]->numTiles; j++)
-                                for(int j=0; j < fpIter->m_rg_crse_patch->fabTiles[li]->numTiles; j++)
-                                    if(j % (perilla::NUM_THREADS_PER_TEAM-perilla::NUM_COMM_THREADS) == nt-perilla::NUM_COMM_THREADS)
-                                    ///if(i % (perilla::NUM_THREADS_PER_TEAM-perilla::NUM_COMM_THREADS) == nt-perilla::NUM_COMM_THREADS)
-                                    {
-                                        //if(myProc == 0 && nt == 4)
-                                        //std::cout << "CC " << cc << " DepTasks " << destGraph->task[f]->depTaskIDs.size() << " i " << i << std::endl;
-                                        ///const Box& dbx = fpIter->m_fpc->dst_boxes[li];
-                                        ///const Box& dbx = *(fpIter->m_rg_crse_patch->fabTiles[f]->tileBx[j]);
-                                        const Box& dbx = *(fpIter->m_rg_crse_patch->fabTiles[li]->tileBx[j]);
-                                        //Box fdomain = fgeom.Domain();
-
-                                        //if(myProc == 0 && nt == 4)
-                                        //std::cout << "CC " << cc << " DepTasks " << destGraph->task[f]->depTaskIDs.size() << " i " << i << " dbx " << dbx << std::endl;
-
-                                        //fout << "FPTL interping gi "<< gi << " li " << li<< " dbx " << dbx << std::endl;
-                                        if(dbx.ok())
-                                        {
-                                            Vector<BCRec> bcr(ncomp);
-                                            amrex::setBC(dbx,fdomain,scomp,0,ncomp,bcs,bcr);
-                                            mapper->interp(fpIter->m_mf_crse_patch[0][mfi], 0, mf[gi], dcomp, ncomp, dbx,
-                                                           ratio, cgeom, fgeom, bcr, idummy1, idummy2, RunOn::Cpu);
-                                        }
-                                    }
-                            }
-                        }
-                        //destGraph->worker[tg]->barr->sync(perilla::NUM_THREADS_PER_TEAM-perilla::NUM_COMM_THREADS);
-                    }
-                    if(!singleT)
-                        destGraph->worker[tg]->barr->sync(perilla::NUM_THREADS_PER_TEAM-perilla::NUM_COMM_THREADS);
-                    /*
-                    end_time_wtime = omp_get_wtime();
-                    if(singleT)
-                        Perilla::getPPPTimeSplit[9] += end_time_wtime - start_time_wtime;
-                    else
-                        if(WorkerThread::isTeamMasterThread(tid))
-                            Perilla::getPPPTimeSplit[9] += end_time_wtime - start_time_wtime;
-                    */
-                }
-            }
-        }
-        /*
-        int mfi = mf.IndexArray()[f];
-        const Box& bx = mf[mfi].box();
-        //if(mfi == 0 )
-        {
-            fout << "Before second FPSL at FPSL mfi " << mfi << " bx " << bx.smallEnd() << bx.bigEnd() << std::endl;
-            for(int i=bx.smallEnd(0); i<=bx.smallEnd(0); i++)
-            {
-
-
-
-    void AsyncFillPatchIterator::initialSend(Vector<AsyncFillPatchIterator*> afpi,
-                                             Vector<AsyncFillPatchIterator*> upper_afpi,
-                                             int  boxGrow,
-                                             Real time,
-                                             int  state_indx,
-                                             int  scomp,
-                                             int  ncomp,
-                                             int  iteration)
-    {
-        int myProc = amrex::ParallelDescriptor::MyProc();
-        int level = afpi[iteration-1]->m_amrlevel.level;
-        if(level == 0 && iteration == 1)
-        {
-            int tg = perilla::wid();
-            for(int f=0; f < afpi[iteration-1]->m_fabs.IndexArray().size(); f++)
-            {
-                if(WorkerThread::isMyRegion(tg, f))
-                {
-                    for(int i=0; i < afpi[iteration-1]->m_amrlevel.parent->nCycle(level); i++){
-                        //fill neighbor fabs of the same AMR level
-                        afpi[i]->PushOnly( boxGrow, time+(i*afpi[iteration-1]->m_amrlevel.parent->dtLevel(level)), state_indx, scomp, ncomp, f, 0xFF, false);
-                    }
-                }
-            }
-        }
-
-        if(level < afpi[iteration-1]->m_amrlevel.parent->finestLevel())
-        {
-            int i = 0;
-            unsigned char tuc = 0x04;
-            //init Fill Patch at the next finer AMR level
-            upper_afpi[i]->PushOnly(boxGrow, time+(i*afpi[iteration-1]->m_amrlevel.parent->dtLevel(level+1)), state_indx, scomp, ncomp, -1/* all FABs*/, tuc, false);
-        }
-    }
-
-    void AsyncFillPatchIterator::Receive (RGIter& rgi,
-                                          int  boxGrow,
-                                          Real time,
-                                          int  index,
-                                          int  scomp,
-                                          int  ncomp,
-                                          int  f,
-                                          bool singleT)
-    {
-        if(rgi.currentItr != 1)
-            return;
-
-        PullOnly(boxGrow, time, index, scomp, ncomp, f, singleT);
-    }
-
-    void AsyncFillPatchIterator::Receive (RGIter* rgi,
-                                          int  boxGrow,
-                                          Real time,
-                                          int  index,
-                                          int  scomp,
-                                          int  ncomp,
-                                          int  f,
-                                          bool singleT)
-    {
-        if(rgi->currentItr != 1)
-            return;
-
-        PullOnly(boxGrow, time, index, scomp, ncomp, f, singleT);
-    }
-
-    void AsyncFillPatchIterator::Receive (RGIter& rgi,
-                                          MultiFab& dest,
-                                          int  boxGrow,
-                                          Real time,
-                                          int  index,
-                                          int  scomp,
-                                          int  ncomp,
-                                          int  f,
-                                          bool singleT)
-    {
-        if(rgi.currentItr != 1)
-            return;
-
-        PullOnly(dest, boxGrow, time, index, scomp, ncomp, f, singleT);
-    }
-
-    void AsyncFillPatchIterator::Receive (RGIter* rgi,
-                                          MultiFab& dest,
-                                          int  boxGrow,
-                                          Real time,
-                                          int  index,
-                                          int  scomp,
-                                          int  ncomp,
-                                          int  f,
-                                          bool singleT)
-    {
-        if(rgi->currentItr != 1)
-            return;
-
-        PullOnly(dest, boxGrow, time, index, scomp, ncomp, f, singleT);
-    }
-}//end amrex namespace
-
-#endif
-//end USE_PERILLA
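All four `Receive` overloads removed above share one guard: the pull runs only on the first pass of the region-graph iterator, so later revisits of the same region are no-ops. A minimal sketch of that guard idiom (illustrative types, not the Perilla API):

```cpp
// Sketch of the "first-iteration-only" guard used by the Receive overloads.
// RGIterLike and pullOnly are made-up stand-ins for RGIter and PullOnly.
#include <cstdio>

struct RGIterLike { int currentItr; };

void pullOnly () { std::printf("PullOnly executed\n"); }

void receive (const RGIterLike& rgi)
{
    if (rgi.currentItr != 1) return; // later iterations: already pulled
    pullOnly();
}

int main ()
{
    RGIterLike first{1};
    RGIterLike second{2};
    receive(first);   // triggers the pull
    receive(second);  // no-op
}
```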
diff --git a/Src/Amr/AMReX_Extrapolater.cpp b/Src/Amr/AMReX_Extrapolater.cpp
index c4e97decfc7..8ce3c6974d5 100644
--- a/Src/Amr/AMReX_Extrapolater.cpp
+++ b/Src/Amr/AMReX_Extrapolater.cpp
@@ -1,53 +1,51 @@
 #include <AMReX_Extrapolater.H>
+#include <AMReX_extrapolater_K.H>
 #include <AMReX_iMultiFab.H>
 
 #ifdef _OPENMP
 #include <omp.h>
 #endif
 
-extern "C"
-{
-    void amrex_first_order_extrap(amrex::Real* u, const int* ulo, const int* uhi, const int& nu,
-                                  const int* msk, const int* mlo, const int* mhi,
-                                  const int* lo, const int* hi,
-                                  const int& scomp, const int& ncomp);
-}
-
 namespace amrex { namespace Extrapolater
 {
     void FirstOrderExtrap (MultiFab& mf, const Geometry& geom, int scomp, int ncomp)
     {
-        Gpu::LaunchSafeGuard lsg(false); // xxxxx TODO gpu
+        BL_ASSERT(mf.nGrow() == 1);
+        BL_ASSERT(scomp >= 0);
+        BL_ASSERT((scomp+ncomp) <= mf.nComp());
 
-        BL_ASSERT(mf.nGrow() == 1);
-        BL_ASSERT(scomp >= 0);
-        BL_ASSERT(ncomp <= mf.nComp());
-
-        iMultiFab mask(mf.boxArray(), mf.DistributionMap(), 1, 1, MFInfo(),
+        iMultiFab mask(mf.boxArray(), mf.DistributionMap(), 1, 1, MFInfo(),
                        DefaultFabFactory<IArrayBox>());
-        mask.BuildMask(geom.Domain(), geom.periodicity(),
-                       finebnd, crsebnd, physbnd, interior);
-
-        int N = mf.nComp();
+        mask.BuildMask(geom.Domain(), geom.periodicity(),
+                       finebnd, crsebnd, physbnd, interior);
 
 #ifdef _OPENMP
-#pragma omp parallel
+#pragma omp parallel if (Gpu::notInLaunchRegion())
 #endif
-        for (MFIter mfi(mf); mfi.isValid(); ++mfi)
-        {
-            const Box& bx = mfi.validbox();
-            const IArrayBox& maskfab = mask[mfi];
-            const Box& maskbox = maskfab.box();
-            FArrayBox& datafab = mf[mfi];
-            const Box& databox = datafab.box();
-
-            amrex_first_order_extrap(datafab.dataPtr(), databox.loVect(), databox.hiVect(), N,
-                                     maskfab.dataPtr(), maskbox.loVect(), maskbox.hiVect(),
-                                     bx.loVect(), bx.hiVect(), scomp, ncomp);
-        }
+        for (MFIter mfi(mf); mfi.isValid(); ++mfi)
+        {
+            const Box& bx = mfi.validbox();
+            auto const& mask_arr = mask.const_array(mfi);
+            auto const& data_arr = mf.array(mfi,scomp);
+
+            if (Gpu::inLaunchRegion()) {
+                ParallelFor(amrex::grow(bx,1), ncomp,
+                [=] AMREX_GPU_DEVICE (int i, int j, int k, int n) noexcept
+                {
+                    if (mask_arr(i,j,k) == crsebnd) data_arr(i,j,k,n) = 0.0;
+                });
+                ParallelFor(amrex::grow(bx,1), ncomp,
+                [=] AMREX_GPU_DEVICE (int i, int j, int k, int n) noexcept
+                {
+                    amrex_first_order_extrap_gpu(i, j, k, n, bx, mask_arr, data_arr);
+                });
+            } else {
+                amrex_first_order_extrap_cpu(bx, ncomp, mask_arr, data_arr);
+            }
+        }
     }
 }
 }
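A note on the two separate `ParallelFor` launches in the GPU branch above: the first pass zeroes every coarse ghost cell so that the mask-weighted sums in the extrapolation pass never read uninitialized memory (zero times NaN is still NaN), and the launch boundary doubles as a synchronization point between the two passes. A minimal 1-D illustration of the same two-pass idea, in plain C++ with made-up values rather than AMReX types:

```cpp
// Two-pass first-order extrapolation on a 1-D strip: pass 1 clears coarse
// ghost cells, pass 2 copies in the adjacent fine value. The -7.0 entries
// stand in for whatever garbage the ghost cells held before the call.
#include <cstdio>

int main ()
{
    constexpr int crse = 0;
    int    mask[6] = {crse, 1, 1, 1, 1, crse}; // 1 = fine interior, 0 = coarse ghost
    double u[6]    = {-7.0, 2.0, 3.0, 4.0, 5.0, -7.0};

    for (int i = 0; i < 6; ++i) {            // pass 1: zero coarse cells
        if (mask[i] == crse) u[i] = 0.0;
    }
    for (int i = 0; i < 6; ++i) {            // pass 2: first-order extrapolation
        if (mask[i] == crse) u[i] = (i == 0) ? u[1] : u[4];
    }
    for (double v : u) std::printf("%g ", v); // 2 2 3 4 5 5
    std::printf("\n");
}
```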
diff --git a/Src/Amr/AMReX_StateData.cpp b/Src/Amr/AMReX_StateData.cpp
index 8014c4b38c0..b61dd8ced6a 100644
--- a/Src/Amr/AMReX_StateData.cpp
+++ b/Src/Amr/AMReX_StateData.cpp
@@ -1,9 +1,8 @@
 #include
+#include
 #include
-#include
-
 #include
 #include
 #include
@@ -16,7 +15,11 @@
 namespace amrex {
 
-static constexpr Real INVALID_TIME = -1.0e200;
+#ifdef AMREX_USE_FLOAT
+static constexpr Real INVALID_TIME = -1.0e30;
+#else
+static constexpr Real INVALID_TIME = -1.0e200;
+#endif
 
 static constexpr int MFNEWDATA = 0;
 static constexpr int MFOLDDATA = 1;
@@ -460,7 +463,7 @@ StateData::FillBoundary (FArrayBox& dest,
         const int sc  = src_comp+i;
         Real*     dat = dest.dataPtr(dc);
 
-        if (desc->master(sc))
+        if (desc->primary(sc))
         {
             const int groupsize = desc->groupsize(sc);
 
@@ -535,7 +538,7 @@ StateData::FillBoundary (Box const& bx,
         const int dc = dest_comp+i;
         const int sc = src_comp+i;
 
-        if (desc->master(sc))
+        if (desc->primary(sc))
         {
             const int groupsize = desc->groupsize(sc);
 
diff --git a/Src/Amr/AMReX_StateDescriptor.H b/Src/Amr/AMReX_StateDescriptor.H
index 2877e0493da..54417adc5ee 100644
--- a/Src/Amr/AMReX_StateDescriptor.H
+++ b/Src/Amr/AMReX_StateDescriptor.H
@@ -219,7 +219,7 @@ public:
     * \param bc
     * \param func
     * \param interp
-    * \param master_or_slave
+    * \param primary_or_secondary
     * \param groupsize
     */
     void setComponent (int comp,
@@ -227,7 +227,7 @@
                        const BCRec&      bc,
                        const BndryFunc&  func,
                        Interpolater*     interp,
-                       bool              master_or_slave,
+                       bool              primary_or_secondary,
                        int               groupsize);
 
     /**
@@ -380,7 +380,7 @@ public:
     */
     bool store_in_checkpoint () const noexcept;
 
-    bool master (int i) const noexcept { return m_master[i]; }
+    bool primary (int i) const noexcept { return m_primary[i]; }
 
     int groupsize (int i) const noexcept { return m_groupsize[i]; }
 
@@ -412,8 +412,8 @@ private:
     Vector<std::string> names;       //!< Printable names of components
     Vector<BCRec>       bc;          //!< Array of bndry types for entire level
     Vector<std::unique_ptr<BndryFunc> > bc_func; //!< Array of pointers to bndry fill functions
-    Vector<int>         m_master;    //!< Are we a master or slave? (true or false)
-    Vector<int>         m_groupsize; //!< Groupsize if we're a master
+    Vector<int>         m_primary;   //!< Are we a primary or secondary? (true or false)
+    Vector<int>         m_groupsize; //!< Groupsize if we're a primary
 
     /**
     * \brief If mapper_comp[icomp] != 0, that map is used instead of mapper
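The `primary`/`groupsize` bookkeeping renamed above is easiest to see on a grouped state such as velocity: `DescriptorList::setComponent` (in the next file) flags only the first member of the group as primary while every member records the group's size, and `StateData::FillBoundary` then issues one grouped fill per primary component. A plain C++ mock-up of that bookkeeping, not the real `StateDescriptor` API:

```cpp
// Mock-up of the primary/groupsize convention: first component of a group
// is primary; groupsize is recorded for every member. The component names
// are illustrative.
#include <cstdio>
#include <vector>

int main ()
{
    const std::vector<const char*> names = {"xvel", "yvel", "zvel"};
    std::vector<int> primary(names.size()), groupsize(names.size());

    for (std::size_t i = 0; i < names.size(); ++i) {
        primary[i]   = (i == 0);          // is_primary = (i == 0)
        groupsize[i] = int(names.size()); // every member records the size
    }

    // a boundary fill visits each component but acts only on the primary
    for (std::size_t i = 0; i < names.size(); ++i) {
        if (primary[i]) {
            std::printf("fill %d components as one group starting at %s\n",
                        groupsize[i], names[i]);
        }
    }
}
```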
diff --git a/Src/Amr/AMReX_StateDescriptor.cpp b/Src/Amr/AMReX_StateDescriptor.cpp
index a978b039def..fb62b4d7305 100644
--- a/Src/Amr/AMReX_StateDescriptor.cpp
+++ b/Src/Amr/AMReX_StateDescriptor.cpp
@@ -20,8 +20,8 @@ StateDescriptor::BndryFunc::clone () const
 
 StateDescriptor::BndryFunc::~BndryFunc () {}
 
 bool
-StateDescriptor::bf_thread_safety (const int* lo,const int* hi,
-                                   const int* dom_lo, const int* dom_hi,
+StateDescriptor::bf_thread_safety (const int* /*lo*/,const int* /*hi*/,
+                                   const int* /*dom_lo*/, const int* /*dom_hi*/,
                                    const int* bc, int ng)
 {
     bool thread_safe = true;
@@ -39,26 +39,26 @@ void
 StateDescriptor::BndryFunc::operator () (Real* data,const int* lo,const int* hi,
                                          const int* dom_lo, const int* dom_hi,
                                          const Real* dx, const Real* grd_lo,
-                                         const Real* time, const int* bc) const
+                                         const Real* time, const int* a_bc) const
 {
     BL_ASSERT(m_func != 0 || m_func3D != 0);
 
-    bool thread_safe = bf_thread_safety(lo, hi, dom_lo, dom_hi, bc, 1);
+    bool thread_safe = bf_thread_safety(lo, hi, dom_lo, dom_hi, a_bc, 1);
     if (thread_safe) {
        if (m_func != 0)
-           m_func(data,AMREX_ARLIM(lo),AMREX_ARLIM(hi),dom_lo,dom_hi,dx,grd_lo,time,bc);
+           m_func(data,AMREX_ARLIM(lo),AMREX_ARLIM(hi),dom_lo,dom_hi,dx,grd_lo,time,a_bc);
        else
            m_func3D(data,AMREX_ARLIM_3D(lo),AMREX_ARLIM_3D(hi),AMREX_ARLIM_3D(dom_lo),AMREX_ARLIM_3D(dom_hi),
-                    AMREX_ZFILL(dx),AMREX_ZFILL(grd_lo),time,bc);
+                    AMREX_ZFILL(dx),AMREX_ZFILL(grd_lo),time,a_bc);
     } else {
 #ifdef _OPENMP
 #pragma omp critical (bndryfunc)
 #endif
        if (m_func != 0)
-           m_func(data,AMREX_ARLIM(lo),AMREX_ARLIM(hi),dom_lo,dom_hi,dx,grd_lo,time,bc);
+           m_func(data,AMREX_ARLIM(lo),AMREX_ARLIM(hi),dom_lo,dom_hi,dx,grd_lo,time,a_bc);
        else
            m_func3D(data,AMREX_ARLIM_3D(lo),AMREX_ARLIM_3D(hi),AMREX_ARLIM_3D(dom_lo),AMREX_ARLIM_3D(dom_hi),
-                    AMREX_ZFILL(dx),AMREX_ZFILL(grd_lo),time,bc);
+                    AMREX_ZFILL(dx),AMREX_ZFILL(grd_lo),time,a_bc);
     }
 }
 
@@ -66,26 +66,26 @@ void
 StateDescriptor::BndryFunc::operator () (Real* data,const int* lo,const int* hi,
                                          const int* dom_lo, const int* dom_hi,
                                          const Real* dx, const Real* grd_lo,
-                                         const Real* time, const int* bc, int ng) const
+                                         const Real* time, const int* a_bc, int ng) const
 {
     BL_ASSERT(m_gfunc != 0 || m_gfunc3D != 0);
 
-    bool thread_safe = bf_thread_safety(lo, hi, dom_lo, dom_hi, bc, ng);
+    bool thread_safe = bf_thread_safety(lo, hi, dom_lo, dom_hi, a_bc, ng);
     if (thread_safe) {
        if (m_gfunc != 0)
-           m_gfunc(data,AMREX_ARLIM(lo),AMREX_ARLIM(hi),dom_lo,dom_hi,dx,grd_lo,time,bc);
+           m_gfunc(data,AMREX_ARLIM(lo),AMREX_ARLIM(hi),dom_lo,dom_hi,dx,grd_lo,time,a_bc);
        else
            m_gfunc3D(data,AMREX_ARLIM_3D(lo),AMREX_ARLIM_3D(hi),AMREX_ARLIM_3D(dom_lo),AMREX_ARLIM_3D(dom_hi),
-                     AMREX_ZFILL(dx),AMREX_ZFILL(grd_lo),time,bc);
+                     AMREX_ZFILL(dx),AMREX_ZFILL(grd_lo),time,a_bc);
     } else {
 #ifdef _OPENMP
 #pragma omp critical (bndryfunc)
 #endif
        if (m_gfunc != 0)
-           m_gfunc(data,AMREX_ARLIM(lo),AMREX_ARLIM(hi),dom_lo,dom_hi,dx,grd_lo,time,bc);
+           m_gfunc(data,AMREX_ARLIM(lo),AMREX_ARLIM(hi),dom_lo,dom_hi,dx,grd_lo,time,a_bc);
        else
            m_gfunc3D(data,AMREX_ARLIM_3D(lo),AMREX_ARLIM_3D(hi),AMREX_ARLIM_3D(dom_lo),AMREX_ARLIM_3D(dom_hi),
-                     AMREX_ZFILL(dx),AMREX_ZFILL(grd_lo),time,bc);
+                     AMREX_ZFILL(dx),AMREX_ZFILL(grd_lo),time,a_bc);
     }
 }
@@ -147,9 +147,9 @@ DescriptorList::setComponent (int indx,
 {
     for (int i = 0; i < nm.size(); i++)
     {
-        const bool master = (i == 0) ? true : false;
+        const bool is_primary = (i == 0) ? true : false;
 
-        desc[indx]->setComponent(comp+i,nm[i],bc[i],func,interp,master,nm.size());
+        desc[indx]->setComponent(comp+i,nm[i],bc[i],func,interp,is_primary,nm.size());
     }
 }
@@ -210,7 +210,7 @@ StateDescriptor::StateDescriptor (IndexType btyp,
     bc.resize(num_comp);
     bc_func.resize(num_comp);
     mapper_comp.resize(num_comp);
-    m_master.resize(num_comp);
+    m_primary.resize(num_comp);
     m_groupsize.resize(num_comp);
     max_map_start_comp.resize(num_comp);
     min_map_end_comp.resize(num_comp);
@@ -336,7 +336,7 @@ StateDescriptor::define (IndexType btyp,
     bc.resize(num_comp);
     bc_func.resize(num_comp);
     mapper_comp.resize(num_comp);
-    m_master.resize(num_comp);
+    m_primary.resize(num_comp);
     m_groupsize.resize(num_comp);
     max_map_start_comp.resize(num_comp);
     min_map_end_comp.resize(num_comp);
@@ -356,7 +356,7 @@ StateDescriptor::setComponent (int comp,
     names[comp]       = nm;
     bc[comp]          = bcr;
     mapper_comp[comp] = a_interp;
-    m_master[comp]    = false;
+    m_primary[comp]   = false;
     m_groupsize[comp] = 0;
 
     if (max_map_start_comp_>=0 && min_map_end_comp_>=0)
@@ -381,12 +381,12 @@ StateDescriptor::setComponent (int comp,
                                const BCRec&     bcr,
                                const StateDescriptor::BndryFunc& func,
                                Interpolater*    a_interp,
-                               bool             a_master,
+                               bool             a_primary,
                                int              a_groupsize)
 {
     setComponent(comp,nm,bcr,func,a_interp,-1,-1);
 
-    m_master[comp]    = a_master;
+    m_primary[comp]   = a_primary;
     m_groupsize[comp] = a_groupsize;
 }
diff --git a/Src/Amr/AMReX_extrapolater_1D_K.H b/Src/Amr/AMReX_extrapolater_1D_K.H
new file mode 100644
index 00000000000..5e939275156
--- /dev/null
+++ b/Src/Amr/AMReX_extrapolater_1D_K.H
@@ -0,0 +1,55 @@
+#ifndef AMReX_extrapolater_1D_K_H_
+#define AMReX_extrapolater_1D_K_H_
+
+namespace amrex {
+
+AMREX_GPU_HOST_DEVICE
+AMREX_FORCE_INLINE
+void
+amrex_first_order_extrap_cpu(amrex::Box const& bx,
+                             int nComp,
+                             amrex::Array4<const int> const& mask,
+                             amrex::Array4<amrex::Real> const& data) noexcept
+{
+   constexpr int crsecell = 0;
+
+   const auto lo = amrex::lbound(bx);
+   const auto hi = amrex::ubound(bx);
+
+   if (mask(lo.x-1,lo.y,lo.z) == crsecell) {
+      for (int n = 0; n < nComp; n++) {
+         data(lo.x-1,lo.y,lo.z,n) = data(lo.x,lo.y,lo.z,n);
+      }
+   }
+   if (mask(hi.x+1,hi.y,hi.z) == crsecell) {
+      for (int n = 0; n < nComp; n++) {
+         data(hi.x+1,hi.y,hi.z,n) = data(hi.x,hi.y,hi.z,n);
+      }
+   }
+
+}
+
+AMREX_GPU_HOST_DEVICE
+AMREX_FORCE_INLINE
+void
+amrex_first_order_extrap_gpu(int i, int j, int k, int n,
+                             amrex::Box const& bx,
+                             amrex::Array4<const int> const& mask,
+                             amrex::Array4<amrex::Real> const& data) noexcept
+{
+   constexpr int crsecell = 0;
+
+   const auto lo = amrex::lbound(bx);
+   const auto hi = amrex::ubound(bx);
+
+   if ( (i == lo.x-1) && ( mask(i,j,k) == crsecell ) ) {
+      data(i,j,k,n) = data(i+1,j,k,n);
+   }
+
+   if ( (i == hi.x+1) && ( mask(i,j,k) == crsecell ) ) {
+      data(i,j,k,n) = data(i-1,j,k,n);
+   }
+}
+
+}
+#endif
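One detail worth calling out before the 2-D and 3-D kernels that follow: every neighbor in their averages is weighted by its mask value, so coarse neighbors (mask == 0) drop out of both the numerator and the denominator, and the earlier zeroing pass guarantees the weighted terms stay finite. A tiny standalone demonstration of that weighting trick (made-up values, plain C++):

```cpp
// Mask-weighted average: the coarse neighbor's value (999 here) cannot
// contaminate the result because its mask weight is zero.
#include <cstdio>

int main ()
{
    int    m[3] = {1, 0, 1};               // 1 = fine neighbor, 0 = coarse
    double u[3] = {10.0, 999.0, 30.0};

    double num = 0.0, den = 0.0;
    for (int s = 0; s < 3; ++s) {
        num += m[s] * u[s];                // coarse term contributes 0
        den += m[s];                       // and is not counted
    }
    std::printf("extrapolated value = %g\n", num / den); // (10+30)/2 = 20
}
```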
must be consistent with Extrapolater.H - integer, parameter :: crsecell = 0 - -contains - - subroutine amrex_first_order_extrap (u, ulo, uhi, nu, msk, mlo, mhi, lo, hi, sc, nc) & - bind(c,name='amrex_first_order_extrap') - - integer, intent(in) :: ulo(1), uhi(1), nu, mlo(1), mhi(1), lo(1), hi(1), sc, nc - real(amrex_real), intent(inout) :: u(ulo(1):uhi(1),0:nu-1) - integer , intent(in) :: msk(mlo(1):mhi(1)) - - integer :: n - - do n = sc, sc+nc-1 - if (msk(lo(1)-1) .eq. crsecell) then - u(lo(1)-1,n) = u(lo(1),n) - end if - - if (msk(hi(1)+1) .eq. crsecell) then - u(hi(1)+1,n) = u(hi(1),n) - end if - end do - - end subroutine amrex_first_order_extrap - -end module amrex_extrapolater diff --git a/Src/Amr/AMReX_extrapolater_2D_K.H b/Src/Amr/AMReX_extrapolater_2D_K.H new file mode 100644 index 00000000000..be1d30ec6b1 --- /dev/null +++ b/Src/Amr/AMReX_extrapolater_2D_K.H @@ -0,0 +1,210 @@ +#ifndef AMReX_extrapolater_2D_K_H_ +#define AMReX_extrapolater_2D_K_H_ + +namespace amrex { + +AMREX_GPU_HOST +AMREX_FORCE_INLINE +void +amrex_first_order_extrap_cpu(amrex::Box const& bx, + int nComp, + amrex::Array4 const& mask, + amrex::Array4 const& data) noexcept +{ + using namespace amrex::literals; + + constexpr int finecell = 1; + constexpr int crsecell = 0; + + const auto lo = amrex::lbound(bx); + const auto hi = amrex::ubound(bx); + + int k = lo.z; + + for (int n = 0; n < nComp; n++) { + + // set all crse cells to zero first + for (int j = lo.y-1; j <= hi.y+1; ++j) { + for (int i = lo.x-1; i <= hi.x+1; ++i) { + if (mask(i,j,k) == crsecell) data(i,j,k,n) = Real(0.0); + } + } + + // Corners + // xlo, ylo + { + int i = lo.x-1; + int j = lo.y-1; + if ( mask(i,j,k) == crsecell ) { + if ( ( mask(i+1,j,k) == finecell ) || + ( mask(i,j+1,k) == finecell ) ) { + data(i,j,k,n) = ( mask(i+1,j,k) * data(i+1,j,k,n) + mask(i,j+1,k) * data(i,j+1,k,n) ) + / ( mask(i+1,j,k) + mask(i,j+1,k) ); + } else { + data(i,j,k,n) = data(i+1,j+1,k,n); + } + } + } + // xlo, yhi + { + int i = lo.x-1; + int j = hi.y+1; + if ( mask(i,j,k) == crsecell ) { + if ( ( mask(i+1,j,k) == finecell ) || + ( mask(i,j-1,k) == finecell ) ) { + data(i,j,k,n) = ( mask(i+1,j,k) * data(i+1,j,k,n) + mask(i,j-1,k) * data(i,j-1,k,n) ) + / ( mask(i+1,j,k) + mask(i,j-1,k) ); + } else { + data(i,j,k,n) = data(i+1,j-1,k,n); + } + } + } + // xhi, ylo + { + int i = hi.x+1; + int j = lo.y-1; + if ( mask(i,j,k) == crsecell ) { + if ( ( mask(i-1,j,k) == finecell ) || + ( mask(i,j+1,k) == finecell ) ) { + data(i,j,k,n) = ( mask(i-1,j,k) * data(i-1,j,k,n) + mask(i,j+1,k) * data(i,j+1,k,n) ) + / ( mask(i-1,j,k) + mask(i,j+1,k) ); + } else { + data(i,j,k,n) = data(i-1,j+1,k,n); + } + } + } + // xhi, yhi + { + int i = hi.x+1; + int j = hi.y+1; + if ( mask(i,j,k) == crsecell ) { + if ( ( mask(i-1,j,k) == finecell ) || + ( mask(i,j-1,k) == finecell ) ) { + data(i,j,k,n) = ( mask(i-1,j,k) * data(i-1,j,k,n) + mask(i,j-1,k) * data(i,j-1,k,n) ) + / ( mask(i-1,j,k) + mask(i,j-1,k) ); + } else { + data(i,j,k,n) = data(i-1,j-1,k,n); + } + } + } + // Edges + // xlo, y-valid + { + int i = lo.x-1; + for (int j = lo.y; j <= hi.y; ++j) { + if ( mask(i,j,k) == crsecell ) { + data(i,j,k,n) = ( mask(i,j-1,k) * data(i,j-1,k,n) + data(i+1,j,k,n) + mask(i,j+1,k) * data(i,j+1,k,n) ) + / ( mask(i,j-1,k) + 1 + mask(i,j+1,k) ); + } + } + } + // xhi, y-valid + { + int i = hi.x+1; + for (int j = lo.y; j <= hi.y; ++j) { + if ( mask(i,j,k) == crsecell ) { + data(i,j,k,n) = ( mask(i,j-1,k) * data(i,j-1,k,n) + data(i-1,j,k,n) + mask(i,j+1,k) * data(i,j+1,k,n) ) + / ( mask(i,j-1,k) + 1 + 
mask(i,j+1,k) ); + } + } + } + // x-valid, ylo + { + int j = lo.y-1; + for (int i = lo.x; i <= hi.x; ++i) { + if ( mask(i,j,k) == crsecell ) { + data(i,j,k,n) = ( mask(i-1,j,k) * data(i-1,j,k,n) + mask(i+1,j,k) * data(i+1,j,k,n) + data(i,j+1,k,n) ) + / ( mask(i-1,j,k) + mask(i+1,j,k) + 1 ); + } + } + } + // x-valid, yhi + { + int j = hi.y+1; + for (int i = lo.x; i <= hi.x; ++i) { + if ( mask(i,j,k) == crsecell ) { + data(i,j,k,n) = ( mask(i-1,j,k) * data(i-1,j,k,n) + mask(i+1,j,k) * data(i+1,j,k,n) + data(i,j-1,k,n) ) + / ( mask(i-1,j,k) + mask(i+1,j,k) + 1 ); + } + } + } + } +} + +AMREX_GPU_HOST_DEVICE +AMREX_FORCE_INLINE +void +amrex_first_order_extrap_gpu(int i, int j, int k, int n, + amrex::Box const& bx, + amrex::Array4 const& mask, + amrex::Array4 const& data) noexcept +{ + using namespace amrex::literals; + + constexpr int finecell = 1; + constexpr int crsecell = 0; + + const auto lo = amrex::lbound(bx); + const auto hi = amrex::ubound(bx); + + if ( mask(i,j,k) == crsecell ) { + // Corners + // xlo, ylo + if ( (i == lo.x-1) && (j == lo.y-1) ) { + if ( ( mask(i+1,j,k) == finecell ) || + ( mask(i,j+1,k) == finecell ) ) { + data(i,j,k,n) = ( mask(i+1,j,k) * data(i+1,j,k,n) + mask(i,j+1,k) * data(i,j+1,k,n) ) + / ( mask(i+1,j,k) + mask(i,j+1,k) ); + } else { + data(i,j,k,n) = data(i+1,j+1,k,n); + } + // xlo, yhi + } else if ( (i == lo.x-1) && (j == hi.y+1) ) { + if ( ( mask(i+1,j,k) == finecell ) || + ( mask(i,j-1,k) == finecell ) ) { + data(i,j,k,n) = ( mask(i+1,j,k) * data(i+1,j,k,n) + mask(i,j-1,k) * data(i,j-1,k,n) ) + / ( mask(i+1,j,k) + mask(i,j-1,k) ); + } else { + data(i,j,k,n) = data(i+1,j-1,k,n); + } + // xhi, ylo + } else if ( (i == hi.x+1) && (j == lo.y-1) ) { + if ( ( mask(i-1,j,k) == finecell ) || + ( mask(i,j+1,k) == finecell ) ) { + data(i,j,k,n) = ( mask(i-1,j,k) * data(i-1,j,k,n) + mask(i,j+1,k) * data(i,j+1,k,n) ) + / ( mask(i-1,j,k) + mask(i,j+1,k) ); + } else { + data(i,j,k,n) = data(i-1,j+1,k,n); + } + // xhi, yhi + } else if ( (i == hi.x+1) && (j == hi.y+1) ) { + if ( ( mask(i-1,j,k) == finecell ) || + ( mask(i,j-1,k) == finecell ) ) { + data(i,j,k,n) = ( mask(i-1,j,k) * data(i-1,j,k,n) + mask(i,j-1,k) * data(i,j-1,k,n) ) + / ( mask(i-1,j,k) + mask(i,j-1,k) ); + } else { + data(i,j,k,n) = data(i-1,j-1,k,n); + } + // Edges + // xlo, y-valid + } else if ( (i == lo.x-1) && (j >= lo.y) && (j <= hi.y) ) { + data(i,j,k,n) = ( mask(i,j-1,k) * data(i,j-1,k,n) + data(i+1,j,k,n) + mask(i,j+1,k) * data(i,j+1,k,n) ) + / ( mask(i,j-1,k) + 1 + mask(i,j+1,k) ); + // xhi, y-valid + } else if ( (i == hi.x+1) && (j >= lo.y) && (j <= hi.y) ) { + data(i,j,k,n) = ( mask(i,j-1,k) * data(i,j-1,k,n) + data(i-1,j,k,n) + mask(i,j+1,k) * data(i,j+1,k,n) ) + / ( mask(i,j-1,k) + 1 + mask(i,j+1,k) ); + // x-valid, ylo + } else if ( (i >= lo.x) && (i <= hi.x) && (j == lo.y-1) ) { + data(i,j,k,n) = ( mask(i-1,j,k) * data(i-1,j,k,n) + mask(i+1,j,k) * data(i+1,j,k,n) + data(i,j+1,k,n) ) + / ( mask(i-1,j,k) + mask(i+1,j,k) + 1 ); + // x-valid, yhi + } else if ( (i >= lo.x) && (i <= hi.x) && (j == hi.y+1) ) { + data(i,j,k,n) = ( mask(i-1,j,k) * data(i-1,j,k,n) + mask(i+1,j,k) * data(i+1,j,k,n) + data(i,j-1,k,n) ) + / ( mask(i-1,j,k) + mask(i+1,j,k) + 1 ); + } + } +} + +} +#endif diff --git a/Src/Amr/AMReX_extrapolater_2d.f90 b/Src/Amr/AMReX_extrapolater_2d.f90 deleted file mode 100644 index 382c9eedb56..00000000000 --- a/Src/Amr/AMReX_extrapolater_2d.f90 +++ /dev/null @@ -1,119 +0,0 @@ -module amrex_extrapolater - - use amrex_fort_module, only : amrex_real - - implicit none - integer, parameter :: 
finecell = 1 ! must be consistent with Extrapolater.H - integer, parameter :: crsecell = 0 - - ! The value of msk is either 0 or 1. - -contains - - subroutine amrex_first_order_extrap (u, ulo, uhi, nu, msk, mlo, mhi, lo, hi, sc, nc) & - bind(c,name='amrex_first_order_extrap') - - integer, intent(in) :: ulo(2), uhi(2), nu, mlo(2), mhi(2), lo(2), hi(2), sc, nc - real(amrex_real), intent(inout) :: u(ulo(1):uhi(1),ulo(2):uhi(2),0:nu-1) - integer , intent(in) :: msk(mlo(1):mhi(1),mlo(2):mhi(2)) - - integer :: i, j, n - - do n = sc, sc+nc-1 - ! set all crse cells to zero first - do j = lo(2)-1, hi(2)+1 - do i = lo(1)-1, hi(1)+1 - if (msk(i,j) .eq. crsecell) then - u(i,j,n) = 0.d0 - end if - end do - end do - - ! ylo, xlo - j = lo(2)-1 - i = lo(1)-1 - if (msk(i,j) .eq. crsecell) then - if (msk(i,j+1) .eq. finecell .or. msk(i+1,j) .eq. finecell) then - u(i,j,n) = (msk(i,j+1)*u(i,j+1,n) + msk(i+1,j)*u(i+1,j,n)) & - & / (msk(i,j+1) + msk(i+1,j) ) - else - u(i,j,n) = u(i+1,j+1,n) - end if - end if - - ! ylo, x-valid - j = lo(2)-1 - do i = lo(1), hi(1) - if (msk(i,j) .eq. crsecell) then - u(i,j,n) = (msk(i-1,j)*u(i-1,j,n)+msk(i+1,j)*u(i+1,j,n)+u(i,j+1,n)) & - & / (msk(i-1,j) +msk(i+1,j) +1 ) - end if - end do - - ! ylo, xhi - j = lo(2)-1 - i = hi(1)+1 - if (msk(i,j) .eq. crsecell) then - if (msk(i-1,j).eq.finecell .or. msk(i,j+1).eq.finecell) then - u(i,j,n) = (msk(i-1,j)*u(i-1,j,n)+msk(i,j+1)*u(i,j+1,n)) & - & / (msk(i-1,j) +msk(i,j+1)) - else - u(i,j,n) = u(i-1,j+1,n) - end if - end if - - ! y-valid, xlo - i = lo(1)-1 - do j = lo(2), hi(2) - if (msk(i,j) .eq. crsecell) then - u(i,j,n) = (msk(i,j-1)*u(i,j-1,n)+u(i+1,j,n)+msk(i,j+1)*u(i,j+1,n)) & - & / (msk(i,j-1) +1 +msk(i,j+1) ) - end if - end do - - ! y-valid, xhi - i = hi(1)+1 - do j = lo(2), hi(2) - if (msk(i,j) .eq. crsecell) then - u(i,j,n) = (msk(i,j-1)*u(i,j-1,n)+u(i-1,j,n)+msk(i,j+1)*u(i,j+1,n)) & - & / (msk(i,j-1) +1 +msk(i,j+1) ) - end if - end do - - ! yhi, xlo - j = hi(2)+1 - i = lo(1)-1 - if (msk(i,j) .eq. crsecell) then - if (msk(i,j-1).eq.finecell .or. msk(i+1,j).eq.finecell) then - u(i,j,n) = (msk(i,j-1)*u(i,j-1,n)+msk(i+1,j)*u(i+1,j,n)) & - & / (msk(i,j-1) +msk(i+1,j) ) - else - u(i,j,n) = u(i+1,j-1,n) - end if - end if - - ! yhi, xvalid - j = hi(2)+1 - do i = lo(1), hi(1) - if (msk(i,j) .eq. crsecell) then - u(i,j,n) = (u(i,j-1,n)+msk(i-1,j)*u(i-1,j,n)+msk(i+1,j)*u(i+1,j,n)) & - & / (1 +msk(i-1,j) +msk(i+1,j) ) - end if - end do - - ! yhi, xhi - i = hi(1)+1 - j = hi(2)+1 - if (msk(i,j) .eq. crsecell) then - if (msk(i-1,j).eq.finecell .or. 
msk(i,j-1).eq.finecell) then - u(i,j,n) = (msk(i-1,j)*u(i-1,j,n)+msk(i,j-1)*u(i,j-1,n)) & - & / (msk(i-1,j) +msk(i,j-1) ) - else - u(i,j,n) = u(i-1,j-1,n) - end if - end if - end do - - end subroutine amrex_first_order_extrap - -end module amrex_extrapolater diff --git a/Src/Amr/AMReX_extrapolater_3D_K.H b/Src/Amr/AMReX_extrapolater_3D_K.H new file mode 100644 index 00000000000..4dd3be07219 --- /dev/null +++ b/Src/Amr/AMReX_extrapolater_3D_K.H @@ -0,0 +1,1124 @@ +#ifndef AMReX_extrapolater_3D_K_H_ +#define AMReX_extrapolater_3D_K_H_ + +namespace amrex { + +AMREX_GPU_HOST +AMREX_FORCE_INLINE +void +amrex_first_order_extrap_cpu(amrex::Box const& bx, + int nComp, + amrex::Array4 const& mask, + amrex::Array4 const& data) noexcept +{ + using namespace amrex::literals; + + constexpr int finecell = 1; + constexpr int crsecell = 0; + + const auto lo = amrex::lbound(bx); + const auto hi = amrex::ubound(bx); + + for (int n = 0; n < nComp; n++) { + + // set all crse cells to zero first + for (int k = lo.z-1; k <= hi.z+1; ++k) { + for (int j = lo.y-1; j <= hi.y+1; ++j) { + for (int i = lo.x-1; i <= hi.x+1; ++i) { + if (mask(i,j,k) == crsecell) data(i,j,k,n) = Real(0.0); + } + } + } + + // Corners + // xlo, ylo, zlo + { + int i = lo.x-1; + int j = lo.y-1; + int k = lo.z-1; + if ( mask(i,j,k) == crsecell ) { + if ( ( mask(i+1,j,k) == finecell ) || + ( mask(i,j+1,k) == finecell ) || + ( mask(i,j,k+1) == finecell ) ) { + data(i,j,k,n) = ( mask(i+1,j,k) * data(i+1,j,k,n) + + mask(i,j+1,k) * data(i,j+1,k,n) + + mask(i,j,k+1) * data(i,j,k+1,n) ) + / ( mask(i+1,j,k) + mask(i,j+1,k) + mask(i,j,k+1) ); + } else if ( ( mask(i+1,j+1,k) == finecell ) || + ( mask(i+1,j,k+1) == finecell ) || + ( mask(i,j+1,k+1) == finecell ) ) { + data(i,j,k,n) = ( mask(i+1,j+1,k) * data(i+1,j+1,k,n) + + mask(i+1,j,k+1) * data(i+1,j,k+1,n) + + mask(i,j+1,k+1) * data(i,j+1,k+1,n) ) + / ( mask(i+1,j+1,k) + mask(i+1,j,k+1) + mask(i,j+1,k+1) ); + } else { + data(i,j,k,n) = data(i+1,j+1,k+1,n); + } + } + } + // xlo, ylo, zhi + { + int i = lo.x-1; + int j = lo.y-1; + int k = hi.z+1; + if ( mask(i,j,k) == crsecell ) { + if ( ( mask(i+1,j,k) == finecell ) || + ( mask(i,j+1,k) == finecell ) || + ( mask(i,j,k-1) == finecell ) ) { + data(i,j,k,n) = ( mask(i+1,j,k) * data(i+1,j,k,n) + + mask(i,j+1,k) * data(i,j+1,k,n) + + mask(i,j,k-1) * data(i,j,k-1,n) ) + / ( mask(i+1,j,k) + mask(i,j+1,k) + mask(i,j,k-1) ); + } else if ( ( mask(i+1,j+1,k) == finecell ) || + ( mask(i+1,j,k-1) == finecell ) || + ( mask(i,j+1,k-1) == finecell ) ) { + data(i,j,k,n) = ( mask(i+1,j+1,k) * data(i+1,j+1,k,n) + + mask(i+1,j,k-1) * data(i+1,j,k-1,n) + + mask(i,j+1,k-1) * data(i,j+1,k-1,n) ) + / ( mask(i+1,j+1,k) + mask(i+1,j,k-1) + mask(i,j+1,k-1) ); + } else { + data(i,j,k,n) = data(i+1,j+1,k-1,n); + } + } + } + // xlo, yhi, zlo + { + int i = lo.x-1; + int j = hi.y+1; + int k = lo.z-1; + if ( mask(i,j,k) == crsecell ) { + if ( ( mask(i+1,j,k) == finecell ) || + ( mask(i,j-1,k) == finecell ) || + ( mask(i,j,k+1) == finecell ) ) { + data(i,j,k,n) = ( mask(i+1,j,k) * data(i+1,j,k,n) + + mask(i,j-1,k) * data(i,j-1,k,n) + + mask(i,j,k+1) * data(i,j,k+1,n) ) + / ( mask(i+1,j,k) + mask(i,j-1,k) + mask(i,j,k+1) ); + } else if ( ( mask(i+1,j-1,k) == finecell ) || + ( mask(i+1,j,k+1) == finecell ) || + ( mask(i,j-1,k+1) == finecell ) ) { + data(i,j,k,n) = ( mask(i+1,j-1,k) * data(i+1,j-1,k,n) + + mask(i+1,j,k+1) * data(i+1,j,k+1,n) + + mask(i,j-1,k+1) * data(i,j-1,k+1,n) ) + / ( mask(i+1,j-1,k) + mask(i+1,j,k+1) + mask(i,j-1,k+1) ); + } else { + data(i,j,k,n) = 
data(i+1,j-1,k+1,n); + } + } + } + // xlo, yhi, zhi + { + int i = lo.x-1; + int j = hi.y+1; + int k = hi.z+1; + if ( mask(i,j,k) == crsecell ) { + if ( ( mask(i+1,j,k) == finecell ) || + ( mask(i,j-1,k) == finecell ) || + ( mask(i,j,k-1) == finecell ) ) { + data(i,j,k,n) = ( mask(i+1,j,k) * data(i+1,j,k,n) + + mask(i,j-1,k) * data(i,j-1,k,n) + + mask(i,j,k-1) * data(i,j,k-1,n) ) + / ( mask(i+1,j,k) + mask(i,j-1,k) + mask(i,j,k-1) ); + } else if ( ( mask(i+1,j-1,k) == finecell ) || + ( mask(i+1,j,k-1) == finecell ) || + ( mask(i,j-1,k-1) == finecell ) ) { + data(i,j,k,n) = ( mask(i+1,j-1,k) * data(i+1,j-1,k,n) + + mask(i+1,j,k-1) * data(i+1,j,k-1,n) + + mask(i,j-1,k-1) * data(i,j-1,k-1,n) ) + / ( mask(i+1,j-1,k) + mask(i+1,j,k-1) + mask(i,j-1,k-1) ); + } else { + data(i,j,k,n) = data(i+1,j-1,k-1,n); + } + } + } + // xhi, ylo, zlo + { + int i = hi.x+1; + int j = lo.y-1; + int k = lo.z-1; + if ( mask(i,j,k) == crsecell ) { + if ( ( mask(i-1,j,k) == finecell ) || + ( mask(i,j+1,k) == finecell ) || + ( mask(i,j,k+1) == finecell ) ) { + data(i,j,k,n) = ( mask(i-1,j,k) * data(i-1,j,k,n) + + mask(i,j+1,k) * data(i,j+1,k,n) + + mask(i,j,k+1) * data(i,j,k+1,n) ) + / ( mask(i-1,j,k) + mask(i,j+1,k) + mask(i,j,k+1) ); + } else if ( ( mask(i-1,j+1,k) == finecell ) || + ( mask(i-1,j,k+1) == finecell ) || + ( mask(i,j+1,k+1) == finecell ) ) { + data(i,j,k,n) = ( mask(i-1,j+1,k) * data(i-1,j+1,k,n) + + mask(i-1,j,k+1) * data(i-1,j,k+1,n) + + mask(i,j+1,k+1) * data(i,j+1,k+1,n) ) + / ( mask(i-1,j+1,k) + mask(i-1,j,k+1) + mask(i,j+1,k+1) ); + } else { + data(i,j,k,n) = data(i-1,j+1,k+1,n); + } + } + } + // xhi, ylo, zhi + { + int i = hi.x+1; + int j = lo.y-1; + int k = hi.z+1; + if ( mask(i,j,k) == crsecell ) { + if ( ( mask(i-1,j,k) == finecell ) || + ( mask(i,j+1,k) == finecell ) || + ( mask(i,j,k-1) == finecell ) ) { + data(i,j,k,n) = ( mask(i-1,j,k) * data(i-1,j,k,n) + + mask(i,j+1,k) * data(i,j+1,k,n) + + mask(i,j,k-1) * data(i,j,k-1,n) ) + / ( mask(i-1,j,k) + mask(i,j+1,k) + mask(i,j,k-1) ); + } else if ( ( mask(i-1,j+1,k) == finecell ) || + ( mask(i-1,j,k-1) == finecell ) || + ( mask(i,j+1,k-1) == finecell ) ) { + data(i,j,k,n) = ( mask(i-1,j+1,k) * data(i-1,j+1,k,n) + + mask(i-1,j,k-1) * data(i-1,j,k-1,n) + + mask(i,j+1,k-1) * data(i,j+1,k-1,n) ) + / ( mask(i-1,j+1,k) + mask(i-1,j,k-1) + mask(i,j+1,k-1) ); + } else { + data(i,j,k,n) = data(i-1,j+1,k-1,n); + } + } + } + // xhi, yhi, zlo + { + int i = hi.x+1; + int j = hi.y+1; + int k = lo.z-1; + if ( mask(i,j,k) == crsecell ) { + if ( ( mask(i-1,j,k) == finecell ) || + ( mask(i,j-1,k) == finecell ) || + ( mask(i,j,k+1) == finecell ) ) { + data(i,j,k,n) = ( mask(i-1,j,k) * data(i-1,j,k,n) + + mask(i,j-1,k) * data(i,j-1,k,n) + + mask(i,j,k+1) * data(i,j,k+1,n) ) + / ( mask(i-1,j,k) + mask(i,j-1,k) + mask(i,j,k+1) ); + } else if ( ( mask(i-1,j-1,k) == finecell ) || + ( mask(i-1,j,k+1) == finecell ) || + ( mask(i,j-1,k+1) == finecell ) ) { + data(i,j,k,n) = ( mask(i-1,j-1,k) * data(i-1,j-1,k,n) + + mask(i-1,j,k+1) * data(i-1,j,k+1,n) + + mask(i,j-1,k+1) * data(i,j-1,k+1,n) ) + / ( mask(i-1,j-1,k) + mask(i-1,j,k+1) + mask(i,j-1,k+1) ); + } else { + data(i,j,k,n) = data(i-1,j-1,k+1,n); + } + } + } + // xhi, yhi, zhi + { + int i = hi.x+1; + int j = hi.y+1; + int k = hi.z+1; + if ( mask(i,j,k) == crsecell ) { + if ( ( mask(i-1,j,k) == finecell ) || + ( mask(i,j-1,k) == finecell ) || + ( mask(i,j,k-1) == finecell ) ) { + data(i,j,k,n) = ( mask(i-1,j,k) * data(i-1,j,k,n) + + mask(i,j-1,k) * data(i,j-1,k,n) + + mask(i,j,k-1) * data(i,j,k-1,n) ) + / ( 
mask(i-1,j,k) + mask(i,j-1,k) + mask(i,j,k-1) ); + } else if ( ( mask(i-1,j-1,k) == finecell ) || + ( mask(i-1,j,k-1) == finecell ) || + ( mask(i,j-1,k-1) == finecell ) ) { + data(i,j,k,n) = ( mask(i-1,j-1,k) * data(i-1,j-1,k,n) + + mask(i-1,j,k-1) * data(i-1,j,k-1,n) + + mask(i,j-1,k-1) * data(i,j-1,k-1,n) ) + / ( mask(i-1,j-1,k) + mask(i-1,j,k-1) + mask(i,j-1,k-1) ); + } else { + data(i,j,k,n) = data(i-1,j-1,k-1,n); + } + } + } + // Edges + // xlo, ylo, z-valid + { + int i = lo.x-1; + int j = lo.y-1; + for (int k = lo.z; k <= hi.z; ++k) { + if ( mask(i,j,k) == crsecell ) { + if ( ( mask(i+1,j,k) == finecell ) || + ( mask(i,j+1,k) == finecell ) || + ( mask(i,j,k-1) == finecell ) || + ( mask(i,j,k+1) == finecell ) ) { + data(i,j,k,n) = ( mask(i+1,j,k) * data(i+1,j,k,n) + + mask(i,j+1,k) * data(i,j+1,k,n) + + mask(i,j,k-1) * data(i,j,k-1,n) + + mask(i,j,k+1) * data(i,j,k+1,n) ) + / ( mask(i+1,j,k) + mask(i,j+1,k) + mask(i,j,k-1) + mask(i,j,k+1) ); + } else { + data(i,j,k,n) = ( data(i+1,j+1,k,n) + + mask(i+1,j,k-1) * data(i+1,j,k-1,n) + + mask(i+1,j,k+1) * data(i+1,j,k+1,n) + + mask(i,j+1,k-1) * data(i,j+1,k-1,n) + + mask(i,j+1,k+1) * data(i,j+1,k+1,n) ) + / ( 1.0 + mask(i+1,j,k-1) + mask(i+1,j,k+1) + mask(i,j+1,k-1) + mask(i,j+1,k+1) ); + } + } + } + } + // xlo, yhi, z-valid + { + int i = lo.x-1; + int j = hi.y+1; + for (int k = lo.z; k <= hi.z; ++k) { + if ( mask(i,j,k) == crsecell ) { + if ( ( mask(i+1,j,k) == finecell ) || + ( mask(i,j-1,k) == finecell ) || + ( mask(i,j,k-1) == finecell ) || + ( mask(i,j,k+1) == finecell ) ) { + data(i,j,k,n) = ( mask(i+1,j,k) * data(i+1,j,k,n) + + mask(i,j-1,k) * data(i,j-1,k,n) + + mask(i,j,k-1) * data(i,j,k-1,n) + + mask(i,j,k+1) * data(i,j,k+1,n) ) + / ( mask(i+1,j,k) + mask(i,j-1,k) + mask(i,j,k-1) + mask(i,j,k+1) ); + } else { + data(i,j,k,n) = ( data(i+1,j-1,k,n) + + mask(i+1,j,k-1) * data(i+1,j,k-1,n) + + mask(i+1,j,k+1) * data(i+1,j,k+1,n) + + mask(i,j-1,k-1) * data(i,j-1,k-1,n) + + mask(i,j-1,k+1) * data(i,j-1,k+1,n) ) + / ( 1.0 + mask(i+1,j,k-1) + mask(i+1,j,k+1) + mask(i,j-1,k-1) + mask(i,j-1,k+1) ); + } + } + } + } + // xhi, ylo, z-valid + { + int i = hi.x+1; + int j = lo.y-1; + for (int k = lo.z; k <= hi.z; ++k) { + if ( mask(i,j,k) == crsecell ) { + if ( ( mask(i-1,j,k) == finecell ) || + ( mask(i,j+1,k) == finecell ) || + ( mask(i,j,k-1) == finecell ) || + ( mask(i,j,k+1) == finecell ) ) { + data(i,j,k,n) = ( mask(i-1,j,k) * data(i-1,j,k,n) + + mask(i,j+1,k) * data(i,j+1,k,n) + + mask(i,j,k-1) * data(i,j,k-1,n) + + mask(i,j,k+1) * data(i,j,k+1,n) ) + / ( mask(i-1,j,k) + mask(i,j+1,k) + mask(i,j,k-1) + mask(i,j,k+1) ); + } else { + data(i,j,k,n) = ( data(i-1,j+1,k,n) + + mask(i-1,j,k-1) * data(i-1,j,k-1,n) + + mask(i-1,j,k+1) * data(i-1,j,k+1,n) + + mask(i,j+1,k-1) * data(i,j+1,k-1,n) + + mask(i,j+1,k+1) * data(i,j+1,k+1,n) ) + / ( 1.0 + mask(i-1,j,k-1) + mask(i-1,j,k+1) + mask(i,j+1,k-1) + mask(i,j+1,k+1) ); + } + } + } + } + // xhi, yhi, z-valid + { + int i = hi.x+1; + int j = hi.y+1; + for (int k = lo.z; k <= hi.z; ++k) { + if ( mask(i,j,k) == crsecell ) { + if ( ( mask(i-1,j,k) == finecell ) || + ( mask(i,j-1,k) == finecell ) || + ( mask(i,j,k-1) == finecell ) || + ( mask(i,j,k+1) == finecell ) ) { + data(i,j,k,n) = ( mask(i-1,j,k) * data(i-1,j,k,n) + + mask(i,j-1,k) * data(i,j-1,k,n) + + mask(i,j,k-1) * data(i,j,k-1,n) + + mask(i,j,k+1) * data(i,j,k+1,n) ) + / ( mask(i-1,j,k) + mask(i,j-1,k) + mask(i,j,k-1) + mask(i,j,k+1) ); + } else { + data(i,j,k,n) = ( data(i-1,j-1,k,n) + + mask(i-1,j,k-1) * data(i-1,j,k-1,n) + + mask(i-1,j,k+1) 
* data(i-1,j,k+1,n) + + mask(i,j-1,k-1) * data(i,j-1,k-1,n) + + mask(i,j-1,k+1) * data(i,j-1,k+1,n) ) + / ( 1.0 + mask(i-1,j,k-1) + mask(i-1,j,k+1) + mask(i,j-1,k-1) + mask(i,j-1,k+1) ); + } + } + } + } + // xlo, y-valid, zlo + { + int i = lo.x-1; + int k = lo.z-1; + for (int j = lo.y; j <= hi.y; ++j) { + if ( mask(i,j,k) == crsecell ) { + if ( ( mask(i+1,j,k) == finecell ) || + ( mask(i,j-1,k) == finecell ) || + ( mask(i,j+1,k) == finecell ) || + ( mask(i,j,k+1) == finecell ) ) { + data(i,j,k,n) = ( mask(i+1,j,k) * data(i+1,j,k,n) + + mask(i,j-1,k) * data(i,j-1,k,n) + + mask(i,j+1,k) * data(i,j+1,k,n) + + mask(i,j,k+1) * data(i,j,k+1,n) ) + / ( mask(i+1,j,k) + mask(i,j-1,k) + mask(i,j+1,k) + mask(i,j,k+1) ); + } else { + data(i,j,k,n) = ( mask(i+1,j-1,k) * data(i+1,j-1,k,n) + + mask(i+1,j+1,k) * data(i+1,j+1,k,n) + + data(i+1,j,k+1,n) + + mask(i,j-1,k+1) * data(i,j-1,k+1,n) + + mask(i,j+1,k+1) * data(i,j+1,k+1,n) ) + / ( mask(i+1,j-1,k) + mask(i+1,j+1,k) + 1.0 + mask(i,j-1,k+1) + mask(i,j+1,k+1) ); + } + } + } + } + // xlo, y-valid, zhi + { + int i = lo.x-1; + int k = hi.z+1; + for (int j = lo.y; j <= hi.y; ++j) { + if ( mask(i,j,k) == crsecell ) { + if ( ( mask(i+1,j,k) == finecell ) || + ( mask(i,j-1,k) == finecell ) || + ( mask(i,j+1,k) == finecell ) || + ( mask(i,j,k-1) == finecell ) ) { + data(i,j,k,n) = ( mask(i+1,j,k) * data(i+1,j,k,n) + + mask(i,j-1,k) * data(i,j-1,k,n) + + mask(i,j+1,k) * data(i,j+1,k,n) + + mask(i,j,k-1) * data(i,j,k-1,n) ) + / ( mask(i+1,j,k) + mask(i,j-1,k) + mask(i,j+1,k) + mask(i,j,k-1) ); + } else { + data(i,j,k,n) = ( mask(i+1,j-1,k) * data(i+1,j-1,k,n) + + mask(i+1,j+1,k) * data(i+1,j+1,k,n) + + data(i+1,j,k-1,n) + + mask(i,j-1,k-1) * data(i,j-1,k-1,n) + + mask(i,j+1,k-1) * data(i,j+1,k-1,n) ) + / ( mask(i+1,j-1,k) + mask(i+1,j+1,k) + 1.0 + mask(i,j-1,k-1) + mask(i,j+1,k-1) ); + } + } + } + } + // xhi, y-valid, zlo + { + int i = hi.x+1; + int k = lo.z-1; + for (int j = lo.y; j <= hi.y; ++j) { + if ( mask(i,j,k) == crsecell ) { + if ( ( mask(i-1,j,k) == finecell ) || + ( mask(i,j-1,k) == finecell ) || + ( mask(i,j+1,k) == finecell ) || + ( mask(i,j,k+1) == finecell ) ) { + data(i,j,k,n) = ( mask(i-1,j,k) * data(i-1,j,k,n) + + mask(i,j-1,k) * data(i,j-1,k,n) + + mask(i,j+1,k) * data(i,j+1,k,n) + + mask(i,j,k+1) * data(i,j,k+1,n) ) + / ( mask(i-1,j,k) + mask(i,j-1,k) + mask(i,j+1,k) + mask(i,j,k+1) ); + } else { + data(i,j,k,n) = ( mask(i-1,j-1,k) * data(i-1,j-1,k,n) + + mask(i-1,j+1,k) * data(i-1,j+1,k,n) + + data(i-1,j,k+1,n) + + mask(i,j-1,k+1) * data(i,j-1,k+1,n) + + mask(i,j+1,k+1) * data(i,j+1,k+1,n) ) + / ( mask(i-1,j-1,k) + mask(i-1,j+1,k) + 1.0 + mask(i,j-1,k+1) + mask(i,j+1,k+1) ); + } + } + } + } + // xhi, y-valid, zhi + { + int i = hi.x+1; + int k = hi.z+1; + for (int j = lo.y; j <= hi.y; ++j) { + if ( mask(i,j,k) == crsecell ) { + if ( ( mask(i-1,j,k) == finecell ) || + ( mask(i,j-1,k) == finecell ) || + ( mask(i,j+1,k) == finecell ) || + ( mask(i,j,k-1) == finecell ) ) { + data(i,j,k,n) = ( mask(i-1,j,k) * data(i-1,j,k,n) + + mask(i,j-1,k) * data(i,j-1,k,n) + + mask(i,j+1,k) * data(i,j+1,k,n) + + mask(i,j,k-1) * data(i,j,k-1,n) ) + / ( mask(i-1,j,k) + mask(i,j-1,k) + mask(i,j+1,k) + mask(i,j,k-1) ); + } else { + data(i,j,k,n) = ( mask(i-1,j-1,k) * data(i-1,j-1,k,n) + + mask(i-1,j+1,k) * data(i-1,j+1,k,n) + + data(i-1,j,k-1,n) + + mask(i,j-1,k-1) * data(i,j-1,k-1,n) + + mask(i,j+1,k-1) * data(i,j+1,k-1,n) ) + / ( mask(i-1,j-1,k) + mask(i-1,j+1,k) + 1.0 + mask(i,j-1,k-1) + mask(i,j+1,k-1) ); + } + } + } + } + // x-valid, ylo, zlo + { + int j = 
lo.y-1; + int k = lo.z-1; + for (int i = lo.x; i <= hi.x; ++i) { + if ( mask(i,j,k) == crsecell ) { + if ( ( mask(i-1,j,k) == finecell ) || + ( mask(i+1,j,k) == finecell ) || + ( mask(i,j+1,k) == finecell ) || + ( mask(i,j,k+1) == finecell ) ) { + data(i,j,k,n) = ( mask(i-1,j,k) * data(i-1,j,k,n) + + mask(i+1,j,k) * data(i+1,j,k,n) + + mask(i,j+1,k) * data(i,j+1,k,n) + + mask(i,j,k+1) * data(i,j,k+1,n) ) + / ( mask(i-1,j,k) + mask(i+1,j,k) + mask(i,j+1,k) + mask(i,j,k+1) ); + } else { + data(i,j,k,n) = ( mask(i-1,j+1,k) * data(i-1,j+1,k,n) + + mask(i+1,j+1,k) * data(i+1,j+1,k,n) + + mask(i-1,j,k+1) * data(i-1,j,k+1,n) + + mask(i+1,j,k+1) * data(i+1,j,k+1,n) + + data(i,j+1,k+1,n) ) + / ( mask(i-1,j+1,k) + mask(i+1,j+1,k) + mask(i-1,j,k+1) + mask(i+1,j,k+1) + 1.0 ); + } + } + } + } + // x-valid, ylo, zhi + { + int j = lo.y-1; + int k = hi.z+1; + for (int i = lo.x; i <= hi.x; ++i) { + if ( mask(i,j,k) == crsecell ) { + if ( ( mask(i-1,j,k) == finecell ) || + ( mask(i+1,j,k) == finecell ) || + ( mask(i,j+1,k) == finecell ) || + ( mask(i,j,k-1) == finecell ) ) { + data(i,j,k,n) = ( mask(i-1,j,k) * data(i-1,j,k,n) + + mask(i+1,j,k) * data(i+1,j,k,n) + + mask(i,j+1,k) * data(i,j+1,k,n) + + mask(i,j,k-1) * data(i,j,k-1,n) ) + / ( mask(i-1,j,k) + mask(i+1,j,k) + mask(i,j+1,k) + mask(i,j,k-1) ); + } else { + data(i,j,k,n) = ( mask(i-1,j+1,k) * data(i-1,j+1,k,n) + + mask(i+1,j+1,k) * data(i+1,j+1,k,n) + + mask(i-1,j,k-1) * data(i-1,j,k-1,n) + + mask(i+1,j,k-1) * data(i+1,j,k-1,n) + + data(i,j+1,k-1,n) ) + / ( mask(i-1,j+1,k) + mask(i+1,j+1,k) + mask(i-1,j,k-1) + mask(i+1,j,k-1) + 1.0 ); + } + } + } + } + // x-valid, yhi, zlo + { + int j = hi.y+1; + int k = lo.z-1; + for (int i = lo.x; i <= hi.x; ++i) { + if ( mask(i,j,k) == crsecell ) { + if ( ( mask(i-1,j,k) == finecell ) || + ( mask(i+1,j,k) == finecell ) || + ( mask(i,j-1,k) == finecell ) || + ( mask(i,j,k+1) == finecell ) ) { + data(i,j,k,n) = ( mask(i-1,j,k) * data(i-1,j,k,n) + + mask(i+1,j,k) * data(i+1,j,k,n) + + mask(i,j-1,k) * data(i,j-1,k,n) + + mask(i,j,k+1) * data(i,j,k+1,n) ) + / ( mask(i-1,j,k) + mask(i+1,j,k) + mask(i,j-1,k) + mask(i,j,k+1) ); + } else { + data(i,j,k,n) = ( mask(i-1,j-1,k) * data(i-1,j-1,k,n) + + mask(i+1,j-1,k) * data(i+1,j-1,k,n) + + mask(i-1,j,k+1) * data(i-1,j,k+1,n) + + mask(i+1,j,k+1) * data(i+1,j,k+1,n) + + data(i,j-1,k+1,n) ) + / ( mask(i-1,j-1,k) + mask(i+1,j-1,k) + mask(i-1,j,k+1) + mask(i+1,j,k+1) + 1.0 ); + } + } + } + } + // x-valid, yhi, zhi + { + int j = hi.y+1; + int k = hi.z+1; + for (int i = lo.x; i <= hi.x; ++i) { + if ( mask(i,j,k) == crsecell ) { + if ( ( mask(i-1,j,k) == finecell ) || + ( mask(i+1,j,k) == finecell ) || + ( mask(i,j-1,k) == finecell ) || + ( mask(i,j,k-1) == finecell ) ) { + data(i,j,k,n) = ( mask(i-1,j,k) * data(i-1,j,k,n) + + mask(i+1,j,k) * data(i+1,j,k,n) + + mask(i,j-1,k) * data(i,j-1,k,n) + + mask(i,j,k-1) * data(i,j,k-1,n) ) + / ( mask(i-1,j,k) + mask(i+1,j,k) + mask(i,j-1,k) + mask(i,j,k-1) ); + } else { + data(i,j,k,n) = ( mask(i-1,j-1,k) * data(i-1,j-1,k,n) + + mask(i+1,j-1,k) * data(i+1,j-1,k,n) + + mask(i-1,j,k-1) * data(i-1,j,k-1,n) + + mask(i+1,j,k-1) * data(i+1,j,k-1,n) + + data(i,j-1,k-1,n) ) + / ( mask(i-1,j-1,k) + mask(i+1,j-1,k) + mask(i-1,j,k-1) + mask(i+1,j,k-1) + 1.0 ); + } + } + } + } + // Faces + // xlo, y-valid, z-valid + { + int i = lo.x-1; + for (int k = lo.z; k <= hi.z; ++k) { + for (int j = lo.y; j <= hi.y; ++j) { + if ( mask(i,j,k) == crsecell ) { + data(i,j,k,n) = ( data(i+1,j,k,n) + + mask(i,j-1,k) * data(i,j-1,k,n) + + mask(i,j+1,k) * 
data(i,j+1,k,n) + + mask(i,j,k-1) * data(i,j,k-1,n) + + mask(i,j,k+1) * data(i,j,k+1,n) ) + / ( 1.0 + mask(i,j-1,k) + mask(i,j+1,k) + mask(i,j,k-1) + mask(i,j,k+1) ); + } + } + } + } + // xhi, y-valid, z-valid + { + int i = hi.x+1; + for (int k = lo.z; k <= hi.z; ++k) { + for (int j = lo.y; j <= hi.y; ++j) { + if ( mask(i,j,k) == crsecell ) { + data(i,j,k,n) = ( data(i-1,j,k,n) + + mask(i,j-1,k) * data(i,j-1,k,n) + + mask(i,j+1,k) * data(i,j+1,k,n) + + mask(i,j,k-1) * data(i,j,k-1,n) + + mask(i,j,k+1) * data(i,j,k+1,n) ) + / ( 1.0 + mask(i,j-1,k) + mask(i,j+1,k) + mask(i,j,k-1) + mask(i,j,k+1) ); + } + } + } + } + // x-valid, ylo, z-valid + { + int j = lo.y-1; + for (int k = lo.z; k <= hi.z; ++k) { + for (int i = lo.x; i <= hi.x; ++i) { + if ( mask(i,j,k) == crsecell ) { + data(i,j,k,n) = ( mask(i-1,j,k) * data(i-1,j,k,n) + + mask(i+1,j,k) * data(i+1,j,k,n) + + data(i,j+1,k,n) + + mask(i,j,k-1) * data(i,j,k-1,n) + + mask(i,j,k+1) * data(i,j,k+1,n) ) + / ( mask(i-1,j,k) + mask(i+1,j,k) + 1.0 + mask(i,j,k-1) + mask(i,j,k+1) ); + } + } + } + } + // x-valid, yhi, z-valid + { + int j = hi.y+1; + for (int k = lo.z; k <= hi.z; ++k) { + for (int i = lo.x; i <= hi.x; ++i) { + if ( mask(i,j,k) == crsecell ) { + data(i,j,k,n) = ( mask(i-1,j,k) * data(i-1,j,k,n) + + mask(i+1,j,k) * data(i+1,j,k,n) + + data(i,j-1,k,n) + + mask(i,j,k-1) * data(i,j,k-1,n) + + mask(i,j,k+1) * data(i,j,k+1,n) ) + / ( mask(i-1,j,k) + mask(i+1,j,k) + 1.0 + mask(i,j,k-1) + mask(i,j,k+1) ); + } + } + } + } + // x-valid, y-valid, zlo + { + int k = lo.z-1; + for (int j = lo.y; j <= hi.y; ++j) { + for (int i = lo.x; i <= hi.x; ++i) { + if ( mask(i,j,k) == crsecell ) { + data(i,j,k,n) = ( mask(i-1,j,k) * data(i-1,j,k,n) + + mask(i+1,j,k) * data(i+1,j,k,n) + + mask(i,j-1,k) * data(i,j-1,k,n) + + mask(i,j+1,k) * data(i,j+1,k,n) + + data(i,j,k+1,n) ) + / ( mask(i-1,j,k) + mask(i+1,j,k) + mask(i,j-1,k) + mask(i,j+1,k) + 1.0 ); + } + } + } + } + // x-valid, y-valid, zhi + { + int k = hi.z+1; + for (int j = lo.y; j <= hi.y; ++j) { + for (int i = lo.x; i <= hi.x; ++i) { + if ( mask(i,j,k) == crsecell ) { + data(i,j,k,n) = ( mask(i-1,j,k) * data(i-1,j,k,n) + + mask(i+1,j,k) * data(i+1,j,k,n) + + mask(i,j-1,k) * data(i,j-1,k,n) + + mask(i,j+1,k) * data(i,j+1,k,n) + + data(i,j,k-1,n) ) + / ( mask(i-1,j,k) + mask(i+1,j,k) + mask(i,j-1,k) + mask(i,j+1,k) + 1.0 ); + } + } + } + } + } +} + +AMREX_GPU_HOST_DEVICE +AMREX_FORCE_INLINE +void +amrex_first_order_extrap_gpu(int i, int j, int k, int n, + amrex::Box const& bx, + amrex::Array4 const& mask, + amrex::Array4 const& data) noexcept +{ + using namespace amrex::literals; + + constexpr int finecell = 1; + constexpr int crsecell = 0; + + const auto lo = amrex::lbound(bx); + const auto hi = amrex::ubound(bx); + + if ( mask(i,j,k) == crsecell ) { + // Corners + // xlo, ylo, zlo + if ( ( i == lo.x-1) && ( j == lo.y-1 ) && ( k == lo.z-1 ) ) { + if ( ( mask(i+1,j,k) == finecell ) || + ( mask(i,j+1,k) == finecell ) || + ( mask(i,j,k+1) == finecell ) ) { + data(i,j,k,n) = ( mask(i+1,j,k) * data(i+1,j,k,n) + + mask(i,j+1,k) * data(i,j+1,k,n) + + mask(i,j,k+1) * data(i,j,k+1,n) ) + / ( mask(i+1,j,k) + mask(i,j+1,k) + mask(i,j,k+1) ); + } else if ( ( mask(i+1,j+1,k) == finecell ) || + ( mask(i+1,j,k+1) == finecell ) || + ( mask(i,j+1,k+1) == finecell ) ) { + data(i,j,k,n) = ( mask(i+1,j+1,k) * data(i+1,j+1,k,n) + + mask(i+1,j,k+1) * data(i+1,j,k+1,n) + + mask(i,j+1,k+1) * data(i,j+1,k+1,n) ) + / ( mask(i+1,j+1,k) + mask(i+1,j,k+1) + mask(i,j+1,k+1) ); + } else { + data(i,j,k,n) = data(i+1,j+1,k+1,n); + } + 
// xlo, ylo, zhi + } else if ( ( i == lo.x-1) && ( j == lo.y-1 ) && ( k == hi.z+1 ) ) { + if ( ( mask(i+1,j,k) == finecell ) || + ( mask(i,j+1,k) == finecell ) || + ( mask(i,j,k-1) == finecell ) ) { + data(i,j,k,n) = ( mask(i+1,j,k) * data(i+1,j,k,n) + + mask(i,j+1,k) * data(i,j+1,k,n) + + mask(i,j,k-1) * data(i,j,k-1,n) ) + / ( mask(i+1,j,k) + mask(i,j+1,k) + mask(i,j,k-1) ); + } else if ( ( mask(i+1,j+1,k) == finecell ) || + ( mask(i+1,j,k-1) == finecell ) || + ( mask(i,j+1,k-1) == finecell ) ) { + data(i,j,k,n) = ( mask(i+1,j+1,k) * data(i+1,j+1,k,n) + + mask(i+1,j,k-1) * data(i+1,j,k-1,n) + + mask(i,j+1,k-1) * data(i,j+1,k-1,n) ) + / ( mask(i+1,j+1,k) + mask(i+1,j,k-1) + mask(i,j+1,k-1) ); + } else { + data(i,j,k,n) = data(i+1,j+1,k-1,n); + } + // xlo, yhi, zlo + } else if ( ( i == lo.x-1) && ( j == hi.y+1 ) && ( k == lo.z-1 ) ) { + if ( ( mask(i+1,j,k) == finecell ) || + ( mask(i,j-1,k) == finecell ) || + ( mask(i,j,k+1) == finecell ) ) { + data(i,j,k,n) = ( mask(i+1,j,k) * data(i+1,j,k,n) + + mask(i,j-1,k) * data(i,j-1,k,n) + + mask(i,j,k+1) * data(i,j,k+1,n) ) + / ( mask(i+1,j,k) + mask(i,j-1,k) + mask(i,j,k+1) ); + } else if ( ( mask(i+1,j-1,k) == finecell ) || + ( mask(i+1,j,k+1) == finecell ) || + ( mask(i,j-1,k+1) == finecell ) ) { + data(i,j,k,n) = ( mask(i+1,j-1,k) * data(i+1,j-1,k,n) + + mask(i+1,j,k+1) * data(i+1,j,k+1,n) + + mask(i,j-1,k+1) * data(i,j-1,k+1,n) ) + / ( mask(i+1,j-1,k) + mask(i+1,j,k+1) + mask(i,j-1,k+1) ); + } else { + data(i,j,k,n) = data(i+1,j-1,k+1,n); + } + // xlo, yhi, zhi + } else if ( ( i == lo.x-1) && ( j == hi.y+1 ) && ( k == hi.z+1 ) ) { + if ( ( mask(i+1,j,k) == finecell ) || + ( mask(i,j-1,k) == finecell ) || + ( mask(i,j,k-1) == finecell ) ) { + data(i,j,k,n) = ( mask(i+1,j,k) * data(i+1,j,k,n) + + mask(i,j-1,k) * data(i,j-1,k,n) + + mask(i,j,k-1) * data(i,j,k-1,n) ) + / ( mask(i+1,j,k) + mask(i,j-1,k) + mask(i,j,k-1) ); + } else if ( ( mask(i+1,j-1,k) == finecell ) || + ( mask(i+1,j,k-1) == finecell ) || + ( mask(i,j-1,k-1) == finecell ) ) { + data(i,j,k,n) = ( mask(i+1,j-1,k) * data(i+1,j-1,k,n) + + mask(i+1,j,k-1) * data(i+1,j,k-1,n) + + mask(i,j-1,k-1) * data(i,j-1,k-1,n) ) + / ( mask(i+1,j-1,k) + mask(i+1,j,k-1) + mask(i,j-1,k-1) ); + } else { + data(i,j,k,n) = data(i+1,j-1,k-1,n); + } + // xhi, ylo, zlo + } else if ( ( i == hi.x+1) && ( j == lo.y-1 ) && ( k == lo.z-1 ) ) { + if ( ( mask(i-1,j,k) == finecell ) || + ( mask(i,j+1,k) == finecell ) || + ( mask(i,j,k+1) == finecell ) ) { + data(i,j,k,n) = ( mask(i-1,j,k) * data(i-1,j,k,n) + + mask(i,j+1,k) * data(i,j+1,k,n) + + mask(i,j,k+1) * data(i,j,k+1,n) ) + / ( mask(i-1,j,k) + mask(i,j+1,k) + mask(i,j,k+1) ); + } else if ( ( mask(i-1,j+1,k) == finecell ) || + ( mask(i-1,j,k+1) == finecell ) || + ( mask(i,j+1,k+1) == finecell ) ) { + data(i,j,k,n) = ( mask(i-1,j+1,k) * data(i-1,j+1,k,n) + + mask(i-1,j,k+1) * data(i-1,j,k+1,n) + + mask(i,j+1,k+1) * data(i,j+1,k+1,n) ) + / ( mask(i-1,j+1,k) + mask(i-1,j,k+1) + mask(i,j+1,k+1) ); + } else { + data(i,j,k,n) = data(i-1,j+1,k+1,n); + } + // xhi, ylo, zhi + } else if ( ( i == hi.x+1) && ( j == lo.y-1 ) && ( k == hi.z+1 ) ) { + if ( ( mask(i-1,j,k) == finecell ) || + ( mask(i,j+1,k) == finecell ) || + ( mask(i,j,k-1) == finecell ) ) { + data(i,j,k,n) = ( mask(i-1,j,k) * data(i-1,j,k,n) + + mask(i,j+1,k) * data(i,j+1,k,n) + + mask(i,j,k-1) * data(i,j,k-1,n) ) + / ( mask(i-1,j,k) + mask(i,j+1,k) + mask(i,j,k-1) ); + } else if ( ( mask(i-1,j+1,k) == finecell ) || + ( mask(i-1,j,k-1) == finecell ) || + ( mask(i,j+1,k-1) == finecell ) ) { + 
data(i,j,k,n) = ( mask(i-1,j+1,k) * data(i-1,j+1,k,n) + + mask(i-1,j,k-1) * data(i-1,j,k-1,n) + + mask(i,j+1,k-1) * data(i,j+1,k-1,n) ) + / ( mask(i-1,j+1,k) + mask(i-1,j,k-1) + mask(i,j+1,k-1) ); + } else { + data(i,j,k,n) = data(i-1,j+1,k-1,n); + } + // xhi, yhi, zlo + } else if ( ( i == hi.x+1) && ( j == hi.y+1 ) && ( k == lo.z-1 ) ) { + if ( ( mask(i-1,j,k) == finecell ) || + ( mask(i,j-1,k) == finecell ) || + ( mask(i,j,k+1) == finecell ) ) { + data(i,j,k,n) = ( mask(i-1,j,k) * data(i-1,j,k,n) + + mask(i,j-1,k) * data(i,j-1,k,n) + + mask(i,j,k+1) * data(i,j,k+1,n) ) + / ( mask(i-1,j,k) + mask(i,j-1,k) + mask(i,j,k+1) ); + } else if ( ( mask(i-1,j-1,k) == finecell ) || + ( mask(i-1,j,k+1) == finecell ) || + ( mask(i,j-1,k+1) == finecell ) ) { + data(i,j,k,n) = ( mask(i-1,j-1,k) * data(i-1,j-1,k,n) + + mask(i-1,j,k+1) * data(i-1,j,k+1,n) + + mask(i,j-1,k+1) * data(i,j-1,k+1,n) ) + / ( mask(i-1,j-1,k) + mask(i-1,j,k+1) + mask(i,j-1,k+1) ); + } else { + data(i,j,k,n) = data(i-1,j-1,k+1,n); + } + // xhi, yhi, zhi + } else if ( ( i == hi.x+1) && ( j == hi.y+1 ) && ( k == hi.z+1 ) ) { + if ( ( mask(i-1,j,k) == finecell ) || + ( mask(i,j-1,k) == finecell ) || + ( mask(i,j,k-1) == finecell ) ) { + data(i,j,k,n) = ( mask(i-1,j,k) * data(i-1,j,k,n) + + mask(i,j-1,k) * data(i,j-1,k,n) + + mask(i,j,k-1) * data(i,j,k-1,n) ) + / ( mask(i-1,j,k) + mask(i,j-1,k) + mask(i,j,k-1) ); + } else if ( ( mask(i-1,j-1,k) == finecell ) || + ( mask(i-1,j,k-1) == finecell ) || + ( mask(i,j-1,k-1) == finecell ) ) { + data(i,j,k,n) = ( mask(i-1,j-1,k) * data(i-1,j-1,k,n) + + mask(i-1,j,k-1) * data(i-1,j,k-1,n) + + mask(i,j-1,k-1) * data(i,j-1,k-1,n) ) + / ( mask(i-1,j-1,k) + mask(i-1,j,k-1) + mask(i,j-1,k-1) ); + } else { + data(i,j,k,n) = data(i-1,j-1,k-1,n); + } + // Edges + // xlo, ylo, z-valid + } else if ( ( i == lo.x-1) && ( j == lo.y-1 ) && + ( k >= lo.z ) && ( k <= hi.z ) ) { + if ( ( mask(i+1,j,k) == finecell ) || + ( mask(i,j+1,k) == finecell ) || + ( mask(i,j,k-1) == finecell ) || + ( mask(i,j,k+1) == finecell ) ) { + data(i,j,k,n) = ( mask(i+1,j,k) * data(i+1,j,k,n) + + mask(i,j+1,k) * data(i,j+1,k,n) + + mask(i,j,k-1) * data(i,j,k-1,n) + + mask(i,j,k+1) * data(i,j,k+1,n) ) + / ( mask(i+1,j,k) + mask(i,j+1,k) + mask(i,j,k-1) + mask(i,j,k+1) ); + } else { + data(i,j,k,n) = ( data(i+1,j+1,k,n) + + mask(i+1,j,k-1) * data(i+1,j,k-1,n) + + mask(i+1,j,k+1) * data(i+1,j,k+1,n) + + mask(i,j+1,k-1) * data(i,j+1,k-1,n) + + mask(i,j+1,k+1) * data(i,j+1,k+1,n) ) + / ( 1.0 + mask(i+1,j,k-1) + mask(i+1,j,k+1) + mask(i,j+1,k-1) + mask(i,j+1,k+1) ); + } + // xlo, yhi, z-valid + } else if ( ( i == lo.x-1) && ( j == hi.y+1 ) && + ( k >= lo.z ) && ( k <= hi.z ) ) { + if ( ( mask(i+1,j,k) == finecell ) || + ( mask(i,j-1,k) == finecell ) || + ( mask(i,j,k-1) == finecell ) || + ( mask(i,j,k+1) == finecell ) ) { + data(i,j,k,n) = ( mask(i+1,j,k) * data(i+1,j,k,n) + + mask(i,j-1,k) * data(i,j-1,k,n) + + mask(i,j,k-1) * data(i,j,k-1,n) + + mask(i,j,k+1) * data(i,j,k+1,n) ) + / ( mask(i+1,j,k) + mask(i,j-1,k) + mask(i,j,k-1) + mask(i,j,k+1) ); + } else { + data(i,j,k,n) = ( data(i+1,j-1,k,n) + + mask(i+1,j,k-1) * data(i+1,j,k-1,n) + + mask(i+1,j,k+1) * data(i+1,j,k+1,n) + + mask(i,j-1,k-1) * data(i,j-1,k-1,n) + + mask(i,j-1,k+1) * data(i,j-1,k+1,n) ) + / ( 1.0 + mask(i+1,j,k-1) + mask(i+1,j,k+1) + mask(i,j-1,k-1) + mask(i,j-1,k+1) ); + } + // xhi, ylo, z-valid + } else if ( ( i == hi.x+1) && ( j == lo.y-1 ) && + ( k >= lo.z ) && ( k <= hi.z ) ) { + if ( ( mask(i-1,j,k) == finecell ) || + ( mask(i,j+1,k) == finecell ) || + ( 
mask(i,j,k-1) == finecell ) || + ( mask(i,j,k+1) == finecell ) ) { + data(i,j,k,n) = ( mask(i-1,j,k) * data(i-1,j,k,n) + + mask(i,j+1,k) * data(i,j+1,k,n) + + mask(i,j,k-1) * data(i,j,k-1,n) + + mask(i,j,k+1) * data(i,j,k+1,n) ) + / ( mask(i-1,j,k) + mask(i,j+1,k) + mask(i,j,k-1) + mask(i,j,k+1) ); + } else { + data(i,j,k,n) = ( data(i-1,j+1,k,n) + + mask(i-1,j,k-1) * data(i-1,j,k-1,n) + + mask(i-1,j,k+1) * data(i-1,j,k+1,n) + + mask(i,j+1,k-1) * data(i,j+1,k-1,n) + + mask(i,j+1,k+1) * data(i,j+1,k+1,n) ) + / ( 1.0 + mask(i-1,j,k-1) + mask(i-1,j,k+1) + mask(i,j+1,k-1) + mask(i,j+1,k+1) ); + } + // xhi, yhi, z-valid + } else if ( ( i == hi.x+1) && ( j == hi.y+1 ) && + ( k >= lo.z ) && ( k <= hi.z ) ) { + if ( ( mask(i-1,j,k) == finecell ) || + ( mask(i,j-1,k) == finecell ) || + ( mask(i,j,k-1) == finecell ) || + ( mask(i,j,k+1) == finecell ) ) { + data(i,j,k,n) = ( mask(i-1,j,k) * data(i-1,j,k,n) + + mask(i,j-1,k) * data(i,j-1,k,n) + + mask(i,j,k-1) * data(i,j,k-1,n) + + mask(i,j,k+1) * data(i,j,k+1,n) ) + / ( mask(i-1,j,k) + mask(i,j-1,k) + mask(i,j,k-1) + mask(i,j,k+1) ); + } else { + data(i,j,k,n) = ( data(i-1,j-1,k,n) + + mask(i-1,j,k-1) * data(i-1,j,k-1,n) + + mask(i-1,j,k+1) * data(i-1,j,k+1,n) + + mask(i,j-1,k-1) * data(i,j-1,k-1,n) + + mask(i,j-1,k+1) * data(i,j-1,k+1,n) ) + / ( 1.0 + mask(i-1,j,k-1) + mask(i-1,j,k+1) + mask(i,j-1,k-1) + mask(i,j-1,k+1) ); + } + // xlo, y-valid, zlo + } else if ( ( i == lo.x-1) && ( j >= lo.y ) && + ( j <= hi.y ) && ( k == lo.z-1 ) ) { + if ( ( mask(i+1,j,k) == finecell ) || + ( mask(i,j-1,k) == finecell ) || + ( mask(i,j+1,k) == finecell ) || + ( mask(i,j,k+1) == finecell ) ) { + data(i,j,k,n) = ( mask(i+1,j,k) * data(i+1,j,k,n) + + mask(i,j-1,k) * data(i,j-1,k,n) + + mask(i,j+1,k) * data(i,j+1,k,n) + + mask(i,j,k+1) * data(i,j,k+1,n) ) + / ( mask(i+1,j,k) + mask(i,j-1,k) + mask(i,j+1,k) + mask(i,j,k+1) ); + } else { + data(i,j,k,n) = ( mask(i+1,j-1,k) * data(i+1,j-1,k,n) + + mask(i+1,j+1,k) * data(i+1,j+1,k,n) + + data(i+1,j,k+1,n) + + mask(i,j-1,k+1) * data(i,j-1,k+1,n) + + mask(i,j+1,k+1) * data(i,j+1,k+1,n) ) + / ( mask(i+1,j-1,k) + mask(i+1,j+1,k) + 1.0 + mask(i,j-1,k+1) + mask(i,j+1,k+1) ); + } + // xlo, y-valid, zhi + } else if ( ( i == lo.x-1) && ( j >= lo.y ) && + ( j <= hi.y ) && ( k == hi.z+1 ) ) { + if ( ( mask(i+1,j,k) == finecell ) || + ( mask(i,j-1,k) == finecell ) || + ( mask(i,j+1,k) == finecell ) || + ( mask(i,j,k-1) == finecell ) ) { + data(i,j,k,n) = ( mask(i+1,j,k) * data(i+1,j,k,n) + + mask(i,j-1,k) * data(i,j-1,k,n) + + mask(i,j+1,k) * data(i,j+1,k,n) + + mask(i,j,k-1) * data(i,j,k-1,n) ) + / ( mask(i+1,j,k) + mask(i,j-1,k) + mask(i,j+1,k) + mask(i,j,k-1) ); + } else { + data(i,j,k,n) = ( mask(i+1,j-1,k) * data(i+1,j-1,k,n) + + mask(i+1,j+1,k) * data(i+1,j+1,k,n) + + data(i+1,j,k-1,n) + + mask(i,j-1,k-1) * data(i,j-1,k-1,n) + + mask(i,j+1,k-1) * data(i,j+1,k-1,n) ) + / ( mask(i+1,j-1,k) + mask(i+1,j+1,k) + 1.0 + mask(i,j-1,k-1) + mask(i,j+1,k-1) ); + } + // xhi, y-valid, zlo + } else if ( ( i == hi.x+1) && ( j >= lo.y ) && + ( j <= hi.y ) && ( k == lo.z-1 ) ) { + if ( ( mask(i-1,j,k) == finecell ) || + ( mask(i,j-1,k) == finecell ) || + ( mask(i,j+1,k) == finecell ) || + ( mask(i,j,k+1) == finecell ) ) { + data(i,j,k,n) = ( mask(i-1,j,k) * data(i-1,j,k,n) + + mask(i,j-1,k) * data(i,j-1,k,n) + + mask(i,j+1,k) * data(i,j+1,k,n) + + mask(i,j,k+1) * data(i,j,k+1,n) ) + / ( mask(i-1,j,k) + mask(i,j-1,k) + mask(i,j+1,k) + mask(i,j,k+1) ); + } else { + data(i,j,k,n) = ( mask(i-1,j-1,k) * data(i-1,j-1,k,n) + + mask(i-1,j+1,k) * 
data(i-1,j+1,k,n) + + data(i-1,j,k+1,n) + + mask(i,j-1,k+1) * data(i,j-1,k+1,n) + + mask(i,j+1,k+1) * data(i,j+1,k+1,n) ) + / ( mask(i-1,j-1,k) + mask(i-1,j+1,k) + 1.0 + mask(i,j-1,k+1) + mask(i,j+1,k+1) ); + } + // xhi, y-valid, zhi + } else if ( ( i == hi.x+1) && ( j >= lo.y ) && + ( j <= hi.y ) && ( k == hi.z+1 ) ) { + if ( ( mask(i-1,j,k) == finecell ) || + ( mask(i,j-1,k) == finecell ) || + ( mask(i,j+1,k) == finecell ) || + ( mask(i,j,k-1) == finecell ) ) { + data(i,j,k,n) = ( mask(i-1,j,k) * data(i-1,j,k,n) + + mask(i,j-1,k) * data(i,j-1,k,n) + + mask(i,j+1,k) * data(i,j+1,k,n) + + mask(i,j,k-1) * data(i,j,k-1,n) ) + / ( mask(i-1,j,k) + mask(i,j-1,k) + mask(i,j+1,k) + mask(i,j,k-1) ); + } else { + data(i,j,k,n) = ( mask(i-1,j-1,k) * data(i-1,j-1,k,n) + + mask(i-1,j+1,k) * data(i-1,j+1,k,n) + + data(i-1,j,k-1,n) + + mask(i,j-1,k-1) * data(i,j-1,k-1,n) + + mask(i,j+1,k-1) * data(i,j+1,k-1,n) ) + / ( mask(i-1,j-1,k) + mask(i-1,j+1,k) + 1.0 + mask(i,j-1,k-1) + mask(i,j+1,k-1) ); + } + // x-valid, ylo, zlo + } else if ( ( i >= lo.x) && ( i <= hi.x ) && + ( j == lo.y-1 ) && ( k == lo.z-1 ) ) { + if ( ( mask(i-1,j,k) == finecell ) || + ( mask(i+1,j,k) == finecell ) || + ( mask(i,j+1,k) == finecell ) || + ( mask(i,j,k+1) == finecell ) ) { + data(i,j,k,n) = ( mask(i-1,j,k) * data(i-1,j,k,n) + + mask(i+1,j,k) * data(i+1,j,k,n) + + mask(i,j+1,k) * data(i,j+1,k,n) + + mask(i,j,k+1) * data(i,j,k+1,n) ) + / ( mask(i-1,j,k) + mask(i+1,j,k) + mask(i,j+1,k) + mask(i,j,k+1) ); + } else { + data(i,j,k,n) = ( mask(i-1,j+1,k) * data(i-1,j+1,k,n) + + mask(i+1,j+1,k) * data(i+1,j+1,k,n) + + mask(i-1,j,k+1) * data(i-1,j,k+1,n) + + mask(i+1,j,k+1) * data(i+1,j,k+1,n) + + data(i,j+1,k+1,n) ) + / ( mask(i-1,j+1,k) + mask(i+1,j+1,k) + mask(i-1,j,k+1) + mask(i+1,j,k+1) + 1.0 ); + } + // x-valid, ylo, zhi + } else if ( ( i >= lo.x) && ( i <= hi.x ) && + ( j == lo.y-1 ) && ( k == hi.z+1 ) ) { + if ( ( mask(i-1,j,k) == finecell ) || + ( mask(i+1,j,k) == finecell ) || + ( mask(i,j+1,k) == finecell ) || + ( mask(i,j,k-1) == finecell ) ) { + data(i,j,k,n) = ( mask(i-1,j,k) * data(i-1,j,k,n) + + mask(i+1,j,k) * data(i+1,j,k,n) + + mask(i,j+1,k) * data(i,j+1,k,n) + + mask(i,j,k-1) * data(i,j,k-1,n) ) + / ( mask(i-1,j,k) + mask(i+1,j,k) + mask(i,j+1,k) + mask(i,j,k-1) ); + } else { + data(i,j,k,n) = ( mask(i-1,j+1,k) * data(i-1,j+1,k,n) + + mask(i+1,j+1,k) * data(i+1,j+1,k,n) + + mask(i-1,j,k-1) * data(i-1,j,k-1,n) + + mask(i+1,j,k-1) * data(i+1,j,k-1,n) + + data(i,j+1,k-1,n) ) + / ( mask(i-1,j+1,k) + mask(i+1,j+1,k) + mask(i-1,j,k-1) + mask(i+1,j,k-1) + 1.0 ); + } + // x-valid, yhi, zlo + } else if ( ( i >= lo.x) && ( i <= hi.x ) && + ( j == hi.y+1 ) && ( k == lo.z-1 ) ) { + if ( ( mask(i-1,j,k) == finecell ) || + ( mask(i+1,j,k) == finecell ) || + ( mask(i,j-1,k) == finecell ) || + ( mask(i,j,k+1) == finecell ) ) { + data(i,j,k,n) = ( mask(i-1,j,k) * data(i-1,j,k,n) + + mask(i+1,j,k) * data(i+1,j,k,n) + + mask(i,j-1,k) * data(i,j-1,k,n) + + mask(i,j,k+1) * data(i,j,k+1,n) ) + / ( mask(i-1,j,k) + mask(i+1,j,k) + mask(i,j-1,k) + mask(i,j,k+1) ); + } else { + data(i,j,k,n) = ( mask(i-1,j-1,k) * data(i-1,j-1,k,n) + + mask(i+1,j-1,k) * data(i+1,j-1,k,n) + + mask(i-1,j,k+1) * data(i-1,j,k+1,n) + + mask(i+1,j,k+1) * data(i+1,j,k+1,n) + + data(i,j-1,k+1,n) ) + / ( mask(i-1,j-1,k) + mask(i+1,j-1,k) + mask(i-1,j,k+1) + mask(i+1,j,k+1) + 1.0 ); + } + // x-valid, yhi, zhi + } else if ( ( i >= lo.x) && ( i <= hi.x ) && + ( j == hi.y+1 ) && ( k == hi.z+1 ) ) { + if ( ( mask(i-1,j,k) == finecell ) || + ( mask(i+1,j,k) == finecell ) 
|| + ( mask(i,j-1,k) == finecell ) || + ( mask(i,j,k-1) == finecell ) ) { + data(i,j,k,n) = ( mask(i-1,j,k) * data(i-1,j,k,n) + + mask(i+1,j,k) * data(i+1,j,k,n) + + mask(i,j-1,k) * data(i,j-1,k,n) + + mask(i,j,k-1) * data(i,j,k-1,n) ) + / ( mask(i-1,j,k) + mask(i+1,j,k) + mask(i,j-1,k) + mask(i,j,k-1) ); + } else { + data(i,j,k,n) = ( mask(i-1,j-1,k) * data(i-1,j-1,k,n) + + mask(i+1,j-1,k) * data(i+1,j-1,k,n) + + mask(i-1,j,k-1) * data(i-1,j,k-1,n) + + mask(i+1,j,k-1) * data(i+1,j,k-1,n) + + data(i,j-1,k-1,n) ) + / ( mask(i-1,j-1,k) + mask(i+1,j-1,k) + mask(i-1,j,k-1) + mask(i+1,j,k-1) + 1.0 ); + } + // Faces + // xlo, y-valid, z-valid + } else if ( ( i == lo.x-1) && + ( j >= lo.y ) && ( j <= hi.y ) && + ( k >= lo.z ) && ( k <= hi.z ) ) { + data(i,j,k,n) = ( data(i+1,j,k,n) + + mask(i,j-1,k) * data(i,j-1,k,n) + + mask(i,j+1,k) * data(i,j+1,k,n) + + mask(i,j,k-1) * data(i,j,k-1,n) + + mask(i,j,k+1) * data(i,j,k+1,n) ) + / ( 1.0 + mask(i,j-1,k) + mask(i,j+1,k) + mask(i,j,k-1) + mask(i,j,k+1) ); + // xhi, y-valid, z-valid + } else if ( ( i == hi.x+1) && + ( j >= lo.y ) && ( j <= hi.y ) && + ( k >= lo.z ) && ( k <= hi.z ) ) { + data(i,j,k,n) = ( data(i-1,j,k,n) + + mask(i,j-1,k) * data(i,j-1,k,n) + + mask(i,j+1,k) * data(i,j+1,k,n) + + mask(i,j,k-1) * data(i,j,k-1,n) + + mask(i,j,k+1) * data(i,j,k+1,n) ) + / ( 1.0 + mask(i,j-1,k) + mask(i,j+1,k) + mask(i,j,k-1) + mask(i,j,k+1) ); + // x-valid, ylo, z-valid + } else if ( ( i >= lo.x ) && ( i <= hi.x ) && + ( j == lo.y-1) && + ( k >= lo.z ) && ( k <= hi.z ) ) { + data(i,j,k,n) = ( mask(i-1,j,k) * data(i-1,j,k,n) + + mask(i+1,j,k) * data(i+1,j,k,n) + + data(i,j+1,k,n) + + mask(i,j,k-1) * data(i,j,k-1,n) + + mask(i,j,k+1) * data(i,j,k+1,n) ) + / ( mask(i-1,j,k) + mask(i+1,j,k) + 1.0 + mask(i,j,k-1) + mask(i,j,k+1) ); + // x-valid, yhi, z-valid + } else if ( ( i >= lo.x ) && ( i <= hi.x ) && + ( j == hi.y+1) && + ( k >= lo.z ) && ( k <= hi.z ) ) { + data(i,j,k,n) = ( mask(i-1,j,k) * data(i-1,j,k,n) + + mask(i+1,j,k) * data(i+1,j,k,n) + + data(i,j-1,k,n) + + mask(i,j,k-1) * data(i,j,k-1,n) + + mask(i,j,k+1) * data(i,j,k+1,n) ) + / ( mask(i-1,j,k) + mask(i+1,j,k) + 1.0 + mask(i,j,k-1) + mask(i,j,k+1) ); + // x-valid, y-valid, zlo + } else if ( ( i >= lo.x ) && ( i <= hi.x ) && + ( j >= lo.y ) && ( j <= hi.y ) && + ( k == lo.z-1) ) { + data(i,j,k,n) = ( mask(i-1,j,k) * data(i-1,j,k,n) + + mask(i+1,j,k) * data(i+1,j,k,n) + + mask(i,j-1,k) * data(i,j-1,k,n) + + mask(i,j+1,k) * data(i,j+1,k,n) + + data(i,j,k+1,n) ) + / ( mask(i-1,j,k) + mask(i+1,j,k) + mask(i,j-1,k) + mask(i,j+1,k) + 1.0 ); + // x-valid, y-valid, zhi + } else if ( ( i >= lo.x ) && ( i <= hi.x ) && + ( j >= lo.y ) && ( j <= hi.y ) && + ( k == hi.z+1) ) { + data(i,j,k,n) = ( mask(i-1,j,k) * data(i-1,j,k,n) + + mask(i+1,j,k) * data(i+1,j,k,n) + + mask(i,j-1,k) * data(i,j-1,k,n) + + mask(i,j+1,k) * data(i,j+1,k,n) + + data(i,j,k-1,n) ) + / ( mask(i-1,j,k) + mask(i+1,j,k) + mask(i,j-1,k) + mask(i,j+1,k) + 1.0 ); + } + } +} + +} +#endif diff --git a/Src/Amr/AMReX_extrapolater_3d.f90 b/Src/Amr/AMReX_extrapolater_3d.f90 deleted file mode 100644 index 6add0d72398..00000000000 --- a/Src/Amr/AMReX_extrapolater_3d.f90 +++ /dev/null @@ -1,656 +0,0 @@ - -module amrex_extrapolater - - use amrex_fort_module, only : amrex_real - - implicit none - integer, parameter :: finecell = 1 ! must be consistent with Extrapolater.H - integer, parameter :: crsecell = 0 - - ! The value of msk is either 0 or 1. 
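The C++ kernel above and the Fortran file being deleted implement the same rule: a coarse ghost cell (mask == 0) receives the average of those neighbors that hold fine data (mask == 1), with the 0/1 mask itself serving as the weight. A minimal standalone sketch of the face case, using illustrative names rather than the AMReX API:

// Sketch, not the AMReX API: one ghost cell on a face of the valid region.
// The neighbor pointing back into the valid region is always usable
// (weight 1); the other four neighbors contribute only where the 0/1 mask
// marks them as fine cells.
double face_ghost_average (double interior, const double nbr[4], const int msk[4])
{
    double num = interior;
    double den = 1.0;
    for (int m = 0; m < 4; ++m) {
        num += msk[m] * nbr[m];   // mask-weighted sum of optional neighbors
        den += msk[m];            // count of contributing neighbors
    }
    return num / den;             // den >= 1 by construction, so always well defined
}

Edge and corner ghost cells have no neighbor that is guaranteed valid, which is why the kernels first test whether any face neighbor is fine and only then fall back to diagonal neighbors, and ultimately to the single cell diagonally opposite the corner.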
- -contains - - subroutine amrex_first_order_extrap (u, ulo, uhi, nu, msk, mlo, mhi, lo, hi, sc, nc) & - bind(c,name='amrex_first_order_extrap') - - integer, intent(in) :: ulo(3), uhi(3), nu, mlo(3), mhi(3), lo(3), hi(3), sc, nc - real(amrex_real), intent(inout) :: u(ulo(1):uhi(1),ulo(2):uhi(2),ulo(3):uhi(3),0:nu-1) - integer , intent(in) :: msk(mlo(1):mhi(1),mlo(2):mhi(2),mlo(3):mhi(3)) - - integer :: i, j, k, n - - do n = sc, sc+nc-1 - ! set all crse cells to zero first - do k = lo(3)-1, hi(3)+1 - do j = lo(2)-1, hi(2)+1 - do i = lo(1)-1, hi(1)+1 - if (msk(i,j,k) .eq. crsecell) then - u(i,j,k,n) = 0.d0 - end if - end do - end do - end do - - ! z-lo, y-lo, x-lo - i = lo(1)-1 - j = lo(2)-1 - k = lo(3)-1 - if (msk(i,j,k) .eq. crsecell) then - if ( msk(i+1,j,k) .eq. finecell & - .or. msk(i,j+1,k) .eq. finecell & - .or. msk(i,j,k+1) .eq. finecell) then - - u(i,j,k,n) = (msk(i+1,j,k) * u(i+1,j,k,n) & - + msk(i,j+1,k) * u(i,j+1,k,n) & - + msk(i,j,k+1) * u(i,j,k+1,n)) & - / (msk(i+1,j,k) + msk(i,j+1,k) + msk(i,j,k+1)) - - else if ( msk(i+1,j+1,k) .eq. finecell & - .or. msk(i+1,j,k+1) .eq. finecell & - .or. msk(i,j+1,k+1) .eq. finecell) then - - u(i,j,k,n) = (msk(i+1,j+1,k) * u(i+1,j+1,k,n) & - + msk(i+1,j,k+1) * u(i+1,j,k+1,n) & - + msk(i,j+1,k+1) * u(i,j+1,k+1,n)) & - / (msk(i+1,j+1,k) + msk(i+1,j,k+1) + msk(i,j+1,k+1)) - else - u(i,j,k,n) = u(i+1,j+1,k+1,n) - end if - end if - - ! z-lo, y-lo, x-valid - j = lo(2)-1 - k = lo(3)-1 - do i = lo(1), hi(1) - if (msk(i,j,k) .eq. crsecell) then - if ( msk(i-1,j,k) .eq. finecell & - .or. msk(i+1,j,k) .eq. finecell & - .or. msk(i,j+1,k) .eq. finecell & - .or. msk(i,j,k+1) .eq. finecell) then - - u(i,j,k,n) = (msk(i-1,j,k) * u(i-1,j,k,n) & - + msk(i+1,j,k) * u(i+1,j,k,n) & - + msk(i,j+1,k) * u(i,j+1,k,n) & - + msk(i,j,k+1) * u(i,j,k+1,n)) & - / (msk(i-1,j,k) + msk(i+1,j,k) + msk(i,j+1,k) + msk(i,j,k+1)) - else - u(i,j,k,n) = (msk(i-1,j+1,k) * u(i-1,j+1,k,n) & - + msk(i+1,j+1,k) * u(i+1,j+1,k,n) & - + msk(i-1,j,k+1) * u(i-1,j,k+1,n) & - + msk(i+1,j,k+1) * u(i+1,j,k+1,n) & - + u(i,j+1,k+1,n)) / & - (msk(i-1,j+1,k) + msk(i+1,j+1,k) + msk(i-1,j,k+1) + msk(i+1,j,k+1) + 1) - end if - end if - end do - - ! z-lo, y-lo, x-hi - i = hi(1)+1 - j = lo(2)-1 - k = lo(3)-1 - if (msk(i,j,k) .eq. crsecell) then - if ( msk(i-1,j,k) .eq. finecell & - .or. msk(i,j+1,k) .eq. finecell & - .or. msk(i,j,k+1) .eq. finecell) then - - u(i,j,k,n) = (msk(i-1,j,k) * u(i-1,j,k,n) & - + msk(i,j+1,k) * u(i,j+1,k,n) & - + msk(i,j,k+1) * u(i,j,k+1,n)) & - / (msk(i-1,j,k) + msk(i,j+1,k) + msk(i,j,k+1)) - - else if ( msk(i-1,j+1,k) .eq. finecell & - .or. msk(i-1,j,k+1) .eq. finecell & - .or. msk(i,j+1,k+1) .eq. finecell) then - - u(i,j,k,n) = (msk(i-1,j+1,k) * u(i-1,j+1,k,n) & - + msk(i-1,j,k+1) * u(i-1,j,k+1,n) & - + msk(i,j+1,k+1) * u(i,j+1,k+1,n)) & - / (msk(i-1,j+1,k) + msk(i-1,j,k+1) + msk(i,j+1,k+1)) - else - u(i,j,k,n) = u(i-1,j+1,k+1,n) - end if - end if - - ! z-lo, y-valid, x-lo - i = lo(1)-1 - k = lo(3)-1 - do j = lo(2), hi(2) - if (msk(i,j,k) .eq. crsecell) then - if ( msk(i+1,j,k) .eq. finecell & - .or. msk(i,j-1,k) .eq. finecell & - .or. msk(i,j+1,k) .eq. finecell & - .or. msk(i,j,k+1) .eq. 
finecell) then - - u(i,j,k,n) = (msk(i+1,j,k) * u(i+1,j,k,n) & - + msk(i,j-1,k) * u(i,j-1,k,n) & - + msk(i,j+1,k) * u(i,j+1,k,n) & - + msk(i,j,k+1) * u(i,j,k+1,n)) / & - (msk(i+1,j,k) + msk(i,j-1,k) + msk(i,j+1,k) + msk(i,j,k+1)) - else - u(i,j,k,n) = (msk(i+1,j-1,k) * u(i+1,j-1,k,n) & - + msk(i+1,j+1,k) * u(i+1,j+1,k,n) & - + u(i+1,j,k+1,n) & - + msk(i,j-1,k+1) * u(i,j-1,k+1,n) & - + msk(i,j+1,k+1) * u(i,j+1,k+1,n)) / & - (msk(i+1,j-1,k) + msk(i+1,j+1,k) + 1 + msk(i,j-1,k+1) + msk(i,j+1,k+1)) - end if - end if - end do - - ! z-lo, y-valid, x-valid - k = lo(3)-1 - do j = lo(2), hi(2) - do i = lo(1), hi(1) - if (msk(i,j,k) .eq. crsecell) then - u(i,j,k,n) = (msk(i-1,j,k) * u(i-1,j,k,n) & - + msk(i+1,j,k) * u(i+1,j,k,n) & - + msk(i,j-1,k) * u(i,j-1,k,n) & - + msk(i,j+1,k) * u(i,j+1,k,n) & - + u(i,j,k+1,n)) / & - (msk(i-1,j,k) + msk(i+1,j,k) + msk(i,j-1,k) + msk(i,j+1,k) + 1) - end if - end do - end do - - ! z-lo, y-valid, x-hi - i = hi(1)+1 - k = lo(3)-1 - do j = lo(2), hi(2) - if (msk(i,j,k) .eq. crsecell) then - if ( msk(i-1,j,k) .eq. finecell & - .or. msk(i,j-1,k) .eq. finecell & - .or. msk(i,j+1,k) .eq. finecell & - .or. msk(i,j,k+1) .eq. finecell) then - - u(i,j,k,n) = (msk(i-1,j,k) * u(i-1,j,k,n) & - + msk(i,j-1,k) * u(i,j-1,k,n) & - + msk(i,j+1,k) * u(i,j+1,k,n) & - + msk(i,j,k+1) * u(i,j,k+1,n)) & - / (msk(i-1,j,k) + msk(i,j-1,k) + msk(i,j+1,k) + msk(i,j,k+1)) - else - u(i,j,k,n) = (msk(i-1,j-1,k)*u(i-1,j-1,k,n) & - + msk(i-1,j+1,k)*u(i-1,j+1,k,n) & - + u(i-1,j,k+1,n) & - + msk(i,j-1,k+1)*u(i,j-1,k+1,n) & - + msk(i,j+1,k+1)*u(i,j+1,k+1,n)) / & - (msk(i-1,j-1,k) + msk(i-1,j+1,k) + 1 + msk(i,j-1,k+1) + msk(i,j+1,k+1)) - end if - end if - end do - - ! z-lo, y-hi, x-lo - i = lo(1)-1 - j = hi(2)+1 - k = lo(3)-1 - if (msk(i,j,k) .eq. crsecell) then - if ( msk(i+1,j,k) .eq. finecell & - .or. msk(i,j-1,k) .eq. finecell & - .or. msk(i,j,k+1) .eq. finecell) then - - u(i,j,k,n) = (msk(i+1,j,k) * u(i+1,j,k,n) & - + msk(i,j-1,k) * u(i,j-1,k,n) & - + msk(i,j,k+1) * u(i,j,k+1,n)) & - / (msk(i+1,j,k) + msk(i,j-1,k) + msk(i,j,k+1)) - - else if ( msk(i+1,j-1,k) .eq. finecell & - .or. msk(i+1,j,k+1) .eq. finecell & - .or. msk(i,j-1,k+1) .eq. finecell) then - - u(i,j,k,n) = (msk(i+1,j-1,k) * u(i+1,j-1,k,n) & - + msk(i+1,j,k+1) * u(i+1,j,k+1,n) & - + msk(i,j-1,k+1) * u(i,j-1,k+1,n)) & - / (msk(i+1,j-1,k) + msk(i+1,j,k+1) + msk(i,j-1,k+1)) - else - u(i,j,k,n) = u(i+1,j-1,k+1,n) - end if - end if - - ! z-lo, y-hi, x-valid - j = hi(2)+1 - k = lo(3)-1 - do i = lo(1), hi(1) - if (msk(i,j,k) .eq. crsecell) then - if ( msk(i-1,j,k) .eq. finecell & - .or. msk(i+1,j,k) .eq. finecell & - .or. msk(i,j-1,k) .eq. finecell & - .or. msk(i,j,k+1) .eq. finecell) then - - u(i,j,k,n) = (msk(i-1,j,k) * u(i-1,j,k,n) & - + msk(i+1,j,k) * u(i+1,j,k,n) & - + msk(i,j-1,k) * u(i,j-1,k,n) & - + msk(i,j,k+1) * u(i,j,k+1,n)) & - / (msk(i-1,j,k) + msk(i+1,j,k) + msk(i,j-1,k) + msk(i,j,k+1)) - else - u(i,j,k,n) = (msk(i-1,j-1,k) * u(i-1,j-1,k,n) & - + msk(i+1,j-1,k) * u(i+1,j-1,k,n) & - + msk(i-1,j,k+1) * u(i-1,j,k+1,n) & - + msk(i+1,j,k+1) * u(i+1,j,k+1,n) & - + u(i,j-1,k+1,n)) / & - (msk(i-1,j-1,k) + msk(i+1,j-1,k) + msk(i-1,j,k+1) + msk(i+1,j,k+1) + 1) - end if - end if - end do - - ! z-lo, y-hi, x-hi - i = hi(1)+1 - j = hi(2)+1 - k = lo(3)-1 - if (msk(i,j,k) .eq. crsecell) then - if ( msk(i-1,j,k) .eq. finecell & - .or. msk(i,j-1,k) .eq. finecell & - .or. msk(i,j,k+1) .eq. 
finecell) then - - u(i,j,k,n) = (msk(i-1,j,k) * u(i-1,j,k,n) & - + msk(i,j-1,k) * u(i,j-1,k,n) & - + msk(i,j,k+1) * u(i,j,k+1,n)) & - / (msk(i-1,j,k) + msk(i,j-1,k) + msk(i,j,k+1)) - - else if ( msk(i-1,j-1,k) .eq. finecell & - .or. msk(i-1,j,k+1) .eq. finecell & - .or. msk(i,j-1,k+1) .eq. finecell) then - - u(i,j,k,n) = (msk(i-1,j-1,k) * u(i-1,j-1,k,n) & - + msk(i-1,j,k+1) * u(i-1,j,k+1,n) & - + msk(i,j-1,k+1) * u(i,j-1,k+1,n)) & - / (msk(i-1,j-1,k) + msk(i-1,j,k+1) + msk(i,j-1,k+1)) - else - u(i,j,k,n) = u(i-1,j-1,k+1,n) - end if - end if - - ! z-valid, y-lo, x-lo - i = lo(1)-1 - j = lo(2)-1 - do k = lo(3), hi(3) - if (msk(i,j,k) .eq. crsecell) then - if ( msk(i+1,j,k) .eq. finecell & - .or. msk(i,j+1,k) .eq. finecell & - .or. msk(i,j,k-1) .eq. finecell & - .or. msk(i,j,k+1) .eq. finecell) then - - u(i,j,k,n) = (msk(i+1,j,k) * u(i+1,j,k,n) & - + msk(i,j+1,k) * u(i,j+1,k,n) & - + msk(i,j,k-1) * u(i,j,k-1,n) & - + msk(i,j,k+1) * u(i,j,k+1,n)) & - / (msk(i+1,j,k) + msk(i,j+1,k) + msk(i,j,k-1) + msk(i,j,k+1)) - else - u(i,j,k,n) = ( u(i+1,j+1,k,n) & - + msk(i+1,j,k-1) * u(i+1,j,k-1,n) & - + msk(i+1,j,k+1) * u(i+1,j,k+1,n) & - + msk(i,j+1,k-1) * u(i,j+1,k-1,n) & - + msk(i,j+1,k+1) * u(i,j+1,k+1,n)) / & - (1 + msk(i+1,j,k-1) + msk(i+1,j,k+1) + msk(i,j+1,k-1) + msk(i,j+1,k+1)) - end if - end if - end do - - ! z-valid, y-lo, x-valid - j = lo(2)-1 - do k = lo(3), hi(3) - do i = lo(1), hi(1) - if (msk(i,j,k) .eq. crsecell) then - u(i,j,k,n) = (msk(i-1,j,k) * u(i-1,j,k,n) & - + msk(i+1,j,k) * u(i+1,j,k,n) & - + u(i,j+1,k,n) & - + msk(i,j,k-1) * u(i,j,k-1,n) & - + msk(i,j,k+1) * u(i,j,k+1,n)) / & - (msk(i-1,j,k) + msk(i+1,j,k) + 1 + msk(i,j,k-1) + msk(i,j,k+1)) - end if - end do - end do - - ! z-valid, y-lo, x-hi - i = hi(1)+1 - j = lo(2)-1 - do k = lo(3), hi(3) - if (msk(i,j,k) .eq. crsecell) then - if ( msk(i-1,j,k) .eq. finecell & - .or. msk(i,j+1,k) .eq. finecell & - .or. msk(i,j,k-1) .eq. finecell & - .or. msk(i,j,k+1) .eq. finecell) then - - u(i,j,k,n) = (msk(i-1,j,k) * u(i-1,j,k,n) & - + msk(i,j+1,k) * u(i,j+1,k,n) & - + msk(i,j,k-1) * u(i,j,k-1,n) & - + msk(i,j,k+1) * u(i,j,k+1,n)) & - / (msk(i-1,j,k) + msk(i,j+1,k) + msk(i,j,k-1) + msk(i,j,k+1)) - else - u(i,j,k,n) = ( u(i-1,j+1,k,n) & - + msk(i-1,j,k-1) * u(i-1,j,k-1,n) & - + msk(i-1,j,k+1) * u(i-1,j,k+1,n) & - + msk(i,j+1,k-1) * u(i,j+1,k-1,n) & - + msk(i,j+1,k+1) * u(i,j+1,k+1,n)) / & - (1 + msk(i-1,j,k-1) + msk(i-1,j,k+1) + msk(i,j+1,k-1) + msk(i,j+1,k+1)) - end if - end if - end do - - ! z-valid, y-valid, x-lo - i = lo(1)-1 - do k = lo(3), hi(3) - do j = lo(2), hi(2) - if (msk(i,j,k) .eq. crsecell) then - u(i,j,k,n) = ( u(i+1,j,k,n) & - + msk(i,j-1,k) * u(i,j-1,k,n) & - + msk(i,j+1,k) * u(i,j+1,k,n) & - + msk(i,j,k-1) * u(i,j,k-1,n) & - + msk(i,j,k+1) * u(i,j,k+1,n)) / & - (1 + msk(i,j-1,k) + msk(i,j+1,k) + msk(i,j,k-1) + msk(i,j,k+1)) - end if - end do - end do - - ! z-valid, y-valid, x-hi - i = hi(1)+1 - do k = lo(3), hi(3) - do j = lo(2), hi(2) - if (msk(i,j,k) .eq. crsecell) then - u(i,j,k,n) = ( u(i-1,j,k,n) & - + msk(i,j-1,k) * u(i,j-1,k,n) & - + msk(i,j+1,k) * u(i,j+1,k,n) & - + msk(i,j,k-1) * u(i,j,k-1,n) & - + msk(i,j,k+1) * u(i,j,k+1,n)) / & - (1 + msk(i,j-1,k) + msk(i,j+1,k) + msk(i,j,k-1) + msk(i,j,k+1)) - end if - end do - end do - - ! z-valid, y-hi, x-lo - i = lo(1)-1 - j = hi(2)+1 - do k = lo(3), hi(3) - if (msk(i,j,k) .eq. crsecell) then - if ( msk(i+1,j,k) .eq. finecell & - .or. msk(i,j-1,k) .eq. finecell & - .or. msk(i,j,k-1) .eq. finecell & - .or. msk(i,j,k+1) .eq. 
finecell) then - - u(i,j,k,n) = (msk(i+1,j,k) * u(i+1,j,k,n) & - + msk(i,j-1,k) * u(i,j-1,k,n) & - + msk(i,j,k-1) * u(i,j,k-1,n) & - + msk(i,j,k+1) * u(i,j,k+1,n)) & - / (msk(i+1,j,k) + msk(i,j-1,k) + msk(i,j,k-1) + msk(i,j,k+1)) - else - u(i,j,k,n) = ( u(i+1,j-1,k,n) & - + msk(i+1,j,k-1) * u(i+1,j,k-1,n) & - + msk(i+1,j,k+1) * u(i+1,j,k+1,n) & - + msk(i,j-1,k-1) * u(i,j-1,k-1,n) & - + msk(i,j-1,k+1) * u(i,j-1,k+1,n)) & - / (1 + msk(i+1,j,k-1) + msk(i+1,j,k+1) + msk(i,j-1,k-1) + msk(i,j-1,k+1)) - end if - end if - end do - - ! z-valid, y-hi, x-valid - j = hi(2)+1 - do k = lo(3), hi(3) - do i = lo(1), hi(1) - if (msk(i,j,k) .eq. crsecell) then - u(i,j,k,n) = (msk(i-1,j,k) * u(i-1,j,k,n) & - + msk(i+1,j,k) * u(i+1,j,k,n) & - + u(i,j-1,k,n) & - + msk(i,j,k-1) * u(i,j,k-1,n) & - + msk(i,j,k+1) * u(i,j,k+1,n)) / & - (msk(i-1,j,k) + msk(i+1,j,k) + 1 + msk(i,j,k-1) + msk(i,j,k+1)) - end if - end do - end do - - ! z-valid, y-hi, x-hi - i = hi(1)+1 - j = hi(2)+1 - do k = lo(3), hi(3) - if (msk(i,j,k) .eq. crsecell) then - if ( msk(i-1,j,k) .eq. finecell & - .or. msk(i,j-1,k) .eq. finecell & - .or. msk(i,j,k-1) .eq. finecell & - .or. msk(i,j,k+1) .eq. finecell) then - - u(i,j,k,n) = (msk(i-1,j,k) * u(i-1,j,k,n) & - + msk(i,j-1,k) * u(i,j-1,k,n) & - + msk(i,j,k-1) * u(i,j,k-1,n) & - + msk(i,j,k+1) * u(i,j,k+1,n)) & - / (msk(i-1,j,k) + msk(i,j-1,k) + msk(i,j,k-1) + msk(i,j,k+1)) - else - u(i,j,k,n) = ( u(i-1,j-1,k,n) & - + msk(i-1,j,k-1) * u(i-1,j,k-1,n) & - + msk(i-1,j,k+1) * u(i-1,j,k+1,n) & - + msk(i,j-1,k-1) * u(i,j-1,k-1,n) & - + msk(i,j-1,k+1) * u(i,j-1,k+1,n)) / & - (1 + msk(i-1,j,k-1) + msk(i-1,j,k+1) + msk(i,j-1,k-1) + msk(i,j-1,k+1)) - end if - end if - end do - - ! z-hi, y-lo, x-lo - i = lo(1)-1 - j = lo(2)-1 - k = hi(3)+1 - if (msk(i,j,k) .eq. crsecell) then - if ( msk(i+1,j,k) .eq. finecell & - .or. msk(i,j+1,k) .eq. finecell & - .or. msk(i,j,k-1) .eq. finecell) then - - u(i,j,k,n) = (msk(i+1,j,k) * u(i+1,j,k,n) & - + msk(i,j+1,k) * u(i,j+1,k,n) & - + msk(i,j,k-1) * u(i,j,k-1,n)) & - / (msk(i+1,j,k) + msk(i,j+1,k) + msk(i,j,k-1)) - - else if ( msk(i+1,j+1,k) .eq. finecell & - .or. msk(i+1,j,k-1) .eq. finecell & - .or. msk(i,j+1,k-1) .eq. finecell) then - - u(i,j,k,n) = (msk(i+1,j+1,k) * u(i+1,j+1,k,n) & - + msk(i+1,j,k-1) * u(i+1,j,k-1,n) & - + msk(i,j+1,k-1) * u(i,j+1,k-1,n)) & - / (msk(i+1,j+1,k) + msk(i+1,j,k-1) + msk(i,j+1,k-1)) - else - u(i,j,k,n) = u(i+1,j+1,k-1,n) - end if - end if - - ! z-hi, y-lo, x-valid - j = lo(2)-1 - k = hi(3)+1 - do i = lo(1), hi(1) - if (msk(i,j,k) .eq. crsecell) then - if ( msk(i-1,j,k) .eq. finecell & - .or. msk(i+1,j,k) .eq. finecell & - .or. msk(i,j+1,k) .eq. finecell & - .or. msk(i,j,k-1) .eq. finecell) then - - u(i,j,k,n) = (msk(i-1,j,k) * u(i-1,j,k,n) & - + msk(i+1,j,k) * u(i+1,j,k,n) & - + msk(i,j+1,k) * u(i,j+1,k,n) & - + msk(i,j,k-1) * u(i,j,k-1,n)) & - / (msk(i-1,j,k) + msk(i+1,j,k) + msk(i,j+1,k) + msk(i,j,k-1)) - else - u(i,j,k,n) = (msk(i-1,j+1,k) * u(i-1,j+1,k,n) & - + msk(i+1,j+1,k) * u(i+1,j+1,k,n) & - + msk(i-1,j,k-1) * u(i-1,j,k-1,n) & - + msk(i+1,j,k-1) * u(i+1,j,k-1,n) & - + u(i,j+1,k-1,n)) / & - (msk(i-1,j+1,k) + msk(i+1,j+1,k) + msk(i-1,j,k-1) + msk(i+1,j,k-1) + 1) - end if - end if - end do - - ! z-hi, y-lo, x-hi - i = hi(1)+1 - j = lo(2)-1 - k = hi(3)+1 - if (msk(i,j,k) .eq. crsecell) then - if ( msk(i-1,j,k) .eq. finecell & - .or. msk(i,j+1,k) .eq. finecell & - .or. msk(i,j,k-1) .eq. 
finecell) then - - u(i,j,k,n) = (msk(i-1,j,k) * u(i-1,j,k,n) & - + msk(i,j+1,k) * u(i,j+1,k,n) & - + msk(i,j,k-1) * u(i,j,k-1,n)) & - / (msk(i-1,j,k) + msk(i,j+1,k) + msk(i,j,k-1)) - - else if ( msk(i-1,j+1,k) .eq. finecell & - .or. msk(i-1,j,k-1) .eq. finecell & - .or. msk(i,j+1,k-1) .eq. finecell) then - - u(i,j,k,n) = (msk(i-1,j+1,k) * u(i-1,j+1,k,n) & - + msk(i-1,j,k-1) * u(i-1,j,k-1,n) & - + msk(i,j+1,k-1) * u(i,j+1,k-1,n)) & - / (msk(i-1,j+1,k) + msk(i-1,j,k-1) + msk(i,j+1,k-1)) - else - u(i,j,k,n) = u(i-1,j+1,k-1,n) - end if - end if - - ! z-hi, y-valid, x-lo - i = lo(1)-1 - k = hi(3)+1 - do j = lo(2), hi(2) - if (msk(i,j,k) .eq. crsecell) then - if ( msk(i+1,j,k) .eq. finecell & - .or. msk(i,j-1,k) .eq. finecell & - .or. msk(i,j+1,k) .eq. finecell & - .or. msk(i,j,k-1) .eq. finecell) then - - u(i,j,k,n) = (msk(i+1,j,k) * u(i+1,j,k,n) & - + msk(i,j-1,k) * u(i,j-1,k,n) & - + msk(i,j+1,k) * u(i,j+1,k,n) & - + msk(i,j,k-1) * u(i,j,k-1,n)) / & - (msk(i+1,j,k) + msk(i,j-1,k) + msk(i,j+1,k) + msk(i,j,k-1)) - else - u(i,j,k,n) = (msk(i+1,j-1,k) * u(i+1,j-1,k,n) & - + msk(i+1,j+1,k) * u(i+1,j+1,k,n) & - + u(i+1,j,k-1,n) & - + msk(i,j-1,k-1) * u(i,j-1,k-1,n) & - + msk(i,j+1,k-1) * u(i,j+1,k-1,n)) / & - (msk(i+1,j-1,k) + msk(i+1,j+1,k) + 1 + msk(i,j-1,k-1) + msk(i,j+1,k-1)) - end if - end if - end do - - ! z-hi, y-valid, x-valid - k = hi(3)+1 - do j = lo(2), hi(2) - do i = lo(1), hi(1) - if (msk(i,j,k) .eq. crsecell) then - u(i,j,k,n) = (msk(i-1,j,k) * u(i-1,j,k,n) & - + msk(i+1,j,k) * u(i+1,j,k,n) & - + msk(i,j-1,k) * u(i,j-1,k,n) & - + msk(i,j+1,k) * u(i,j+1,k,n) & - + u(i,j,k-1,n)) / & - (msk(i-1,j,k) + msk(i+1,j,k) + msk(i,j-1,k) + msk(i,j+1,k) + 1) - end if - end do - end do - - ! z-hi, y-valid, x-hi - i = hi(1)+1 - k = hi(3)+1 - do j = lo(2), hi(2) - if (msk(i,j,k) .eq. crsecell) then - if ( msk(i-1,j,k) .eq. finecell & - .or. msk(i,j-1,k) .eq. finecell & - .or. msk(i,j+1,k) .eq. finecell & - .or. msk(i,j,k-1) .eq. finecell) then - - u(i,j,k,n) = (msk(i-1,j,k) * u(i-1,j,k,n) & - + msk(i,j-1,k) * u(i,j-1,k,n) & - + msk(i,j+1,k) * u(i,j+1,k,n) & - + msk(i,j,k-1) * u(i,j,k-1,n)) / & - (msk(i-1,j,k) + msk(i,j-1,k) + msk(i,j+1,k) + msk(i,j,k-1)) - else - u(i,j,k,n) = (msk(i-1,j-1,k) * u(i-1,j-1,k,n) & - + msk(i-1,j+1,k) * u(i-1,j+1,k,n) & - + u(i-1,j,k-1,n) & - + msk(i,j-1,k-1) * u(i,j-1,k-1,n) & - + msk(i,j+1,k-1) * u(i,j+1,k-1,n)) / & - (msk(i-1,j-1,k) + msk(i-1,j+1,k) + 1 + msk(i,j-1,k-1) + msk(i,j+1,k-1)) - end if - end if - end do - - ! z-hi, y-hi, x-lo - i = lo(1)-1 - j = hi(2)+1 - k = hi(3)+1 - if (msk(i,j,k) .eq. crsecell) then - if ( msk(i+1,j,k) .eq. finecell & - .or. msk(i,j-1,k) .eq. finecell & - .or. msk(i,j,k-1) .eq. finecell) then - - u(i,j,k,n) = (msk(i+1,j,k) * u(i+1,j,k,n) & - + msk(i,j-1,k) * u(i,j-1,k,n) & - + msk(i,j,k-1) * u(i,j,k-1,n)) & - / (msk(i+1,j,k) + msk(i,j-1,k) + msk(i,j,k-1)) - - else if ( msk(i+1,j-1,k) .eq. finecell & - .or. msk(i+1,j,k-1) .eq. finecell & - .or. msk(i,j-1,k-1) .eq. finecell) then - - u(i,j,k,n) = (msk(i+1,j-1,k) * u(i+1,j-1,k,n) & - + msk(i+1,j,k-1) * u(i+1,j,k-1,n) & - + msk(i,j-1,k-1) * u(i,j-1,k-1,n)) & - / (msk(i+1,j-1,k) + msk(i+1,j,k-1) + msk(i,j-1,k-1)) - else - u(i,j,k,n) = u(i+1,j-1,k-1,n) - end if - end if - - ! z-hi, y-hi, x-valid - j = hi(2)+1 - k = hi(3)+1 - do i = lo(1), hi(1) - if (msk(i,j,k) .eq. crsecell) then - if ( msk(i-1,j,k) .eq. finecell & - .or. msk(i+1,j,k) .eq. finecell & - .or. msk(i,j-1,k) .eq. finecell & - .or. msk(i,j,k-1) .eq. 
finecell) then - - u(i,j,k,n) = (msk(i-1,j,k) * u(i-1,j,k,n) & - + msk(i+1,j,k) * u(i+1,j,k,n) & - + msk(i,j-1,k) * u(i,j-1,k,n) & - + msk(i,j,k-1) * u(i,j,k-1,n)) & - / (msk(i-1,j,k) + msk(i+1,j,k) + msk(i,j-1,k) + msk(i,j,k-1)) - else - u(i,j,k,n) = (msk(i-1,j-1,k) * u(i-1,j-1,k,n) & - + msk(i+1,j-1,k) * u(i+1,j-1,k,n) & - + msk(i-1,j,k-1) * u(i-1,j,k-1,n) & - + msk(i+1,j,k-1) * u(i+1,j,k-1,n) & - + u(i,j-1,k-1,n)) / & - (msk(i-1,j-1,k) + msk(i+1,j-1,k) + msk(i-1,j,k-1) + msk(i+1,j,k-1) + 1) - end if - end if - end do - - ! z-hi, y-hi, x-hi - i = hi(1)+1 - j = hi(2)+1 - k = hi(3)+1 - if (msk(i,j,k) .eq. crsecell) then - if ( msk(i-1,j,k) .eq. finecell & - .or. msk(i,j-1,k) .eq. finecell & - .or. msk(i,j,k-1) .eq. finecell) then - - u(i,j,k,n) = (msk(i-1,j,k) * u(i-1,j,k,n) & - + msk(i,j-1,k) * u(i,j-1,k,n) & - + msk(i,j,k-1) * u(i,j,k-1,n)) & - / (msk(i-1,j,k) + msk(i,j-1,k) + msk(i,j,k-1)) - - else if ( msk(i-1,j-1,k) .eq. finecell & - .or. msk(i-1,j,k-1) .eq. finecell & - .or. msk(i,j-1,k-1) .eq. finecell) then - - u(i,j,k,n) = (msk(i-1,j-1,k) * u(i-1,j-1,k,n) & - + msk(i-1,j,k-1) * u(i-1,j,k-1,n) & - + msk(i,j-1,k-1) * u(i,j-1,k-1,n)) & - / (msk(i-1,j-1,k) + msk(i-1,j,k-1) + msk(i,j-1,k-1)) - else - u(i,j,k,n) = u(i-1,j-1,k-1,n) - end if - end if - end do - - end subroutine amrex_first_order_extrap - -end module amrex_extrapolater diff --git a/Src/Amr/AMReX_extrapolater_K.H b/Src/Amr/AMReX_extrapolater_K.H new file mode 100644 index 00000000000..2552bb069c5 --- /dev/null +++ b/Src/Amr/AMReX_extrapolater_K.H @@ -0,0 +1,16 @@ +#ifndef AMReX_extrapolater_K_H_ +#define AMReX_extrapolater_K_H_ + +#include +#include +#include + +#if (AMREX_SPACEDIM == 1) +#include +#elif (AMREX_SPACEDIM == 2) +#include +#else +#include +#endif + +#endif diff --git a/Src/Amr/CMakeLists.txt b/Src/Amr/CMakeLists.txt index 78ac127f65f..b5d16891dde 100644 --- a/Src/Amr/CMakeLists.txt +++ b/Src/Amr/CMakeLists.txt @@ -16,12 +16,8 @@ target_sources(amrex AMReX_AuxBoundaryData.H AMReX_StateDescriptor.cpp AMReX_AuxBoundaryData.cpp + AMReX_Extrapolater.H + AMReX_Extrapolater.cpp + AMReX_extrapolater_K.H + AMReX_extrapolater_${AMReX_SPACEDIM}D_K.H ) - -if (ENABLE_FORTRAN) - target_sources(amrex - PRIVATE - AMReX_Extrapolater.H - AMReX_Extrapolater.cpp - AMReX_extrapolater_${DIM}d.f90 ) -endif () diff --git a/Src/Amr/Make.package b/Src/Amr/Make.package index 42595197e4d..12a0cf0b8c4 100644 --- a/Src/Amr/Make.package +++ b/Src/Amr/Make.package @@ -1,17 +1,11 @@ AMRLIB_BASE=EXE -C$(AMRLIB_BASE)_sources += AMReX_Amr.cpp AMReX_AmrLevel.cpp AMReX_AsyncFillPatch.cpp AMReX_Derive.cpp AMReX_StateData.cpp \ - AMReX_StateDescriptor.cpp AMReX_AuxBoundaryData.cpp +C$(AMRLIB_BASE)_sources += AMReX_Amr.cpp AMReX_AmrLevel.cpp AMReX_Derive.cpp AMReX_StateData.cpp \ + AMReX_StateDescriptor.cpp AMReX_AuxBoundaryData.cpp AMReX_Extrapolater.cpp C$(AMRLIB_BASE)_headers += AMReX_Amr.H AMReX_AmrLevel.H AMReX_Derive.H AMReX_LevelBld.H AMReX_StateData.H \ - AMReX_StateDescriptor.H AMReX_PROB_AMR_F.H AMReX_AuxBoundaryData.H - -ifneq ($(BL_NO_FORT),TRUE) - f90$(AMRLIB_BASE)_sources += AMReX_extrapolater_$(DIM)d.f90 - C$(AMRLIB_BASE)_sources += AMReX_Extrapolater.cpp - C$(AMRLIB_BASE)_headers += AMReX_Extrapolater.H -endif + AMReX_StateDescriptor.H AMReX_PROB_AMR_F.H AMReX_AuxBoundaryData.H AMReX_Extrapolater.H AMReX_extrapolater_K.H AMReX_extrapolater_$(DIM)D_K.H VPATH_LOCATIONS += $(AMREX_HOME)/Src/Amr INCLUDE_LOCATIONS += $(AMREX_HOME)/Src/Amr diff --git a/Src/AmrCore/AMReX_AmrCore.cpp b/Src/AmrCore/AMReX_AmrCore.cpp index 
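The AMReX_AmrCore.cpp hunk that follows replaces the 100.0_rt user-defined literal with an explicit Real(100.0) cast. The two spellings denote the same value; a plausible motivation, not stated in the diff, is to avoid depending on the _rt literal being visible to (and supported by) every host and device compiler. A minimal sketch, with Real standing in for amrex::Real:

#include <cstdio>

using Real = double;   // float when the library is built in single precision

int main ()
{
    long ncells = 512;
    double ntot = 4096.0;
    Real frac = Real(100.0) * (Real(ncells) / ntot);  // same value as 100.0_rt*(...)
    std::printf("%g%%\n", frac);                      // prints 12.5%
    return 0;
}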
5e3fca57267..f94142a0e68 100644 --- a/Src/AmrCore/AMReX_AmrCore.cpp +++ b/Src/AmrCore/AMReX_AmrCore.cpp @@ -127,7 +127,7 @@ AmrCore::printGridSummary (std::ostream& os, int min_lev, int max_lev) const noe int numgrid = bs.size(); Long ncells = bs.numPts(); double ntot = Geom(lev).Domain().d_numPts(); - Real frac = 100.0_rt*(Real(ncells) / ntot); + Real frac = Real(100.0)*(Real(ncells) / ntot); os << " Level " << lev diff --git a/Src/AmrCore/AMReX_AmrMesh.H b/Src/AmrCore/AMReX_AmrMesh.H index c79a0ebe07a..65b5cad8f76 100644 --- a/Src/AmrCore/AMReX_AmrMesh.H +++ b/Src/AmrCore/AMReX_AmrMesh.H @@ -249,6 +249,7 @@ protected: Vector grids; unsigned int num_setdm = 0; + unsigned int num_setba = 0; void checkInput(); diff --git a/Src/AmrCore/AMReX_AmrMesh.cpp b/Src/AmrCore/AMReX_AmrMesh.cpp index ff9b290c1d3..1aeda59d833 100644 --- a/Src/AmrCore/AMReX_AmrMesh.cpp +++ b/Src/AmrCore/AMReX_AmrMesh.cpp @@ -380,6 +380,7 @@ AmrMesh::SetDistributionMap (int lev, const DistributionMapping& dmap_in) noexce void AmrMesh::SetBoxArray (int lev, const BoxArray& ba_in) noexcept { + ++num_setba; if (grids[lev] != ba_in) grids[lev] = ba_in; } @@ -502,17 +503,16 @@ AmrMesh::MakeNewGrids (int lbase, Real time, int& new_finest, Vector& Vector p_n(max_level); // Proper nesting domain. Vector p_n_comp(max_level); // Complement proper nesting domain. - BoxList bl(grids[lbase]); - bl.simplify(); + BoxList bl = grids[lbase].simplified_list(); bl.coarsen(bf_lev[lbase]); - p_n_comp[lbase].complementIn(pc_domain[lbase],bl); + p_n_comp[lbase].parallelComplementIn(pc_domain[lbase],bl); p_n_comp[lbase].simplify(); p_n_comp[lbase].accrete(n_proper); if (geom[lbase].isAnyPeriodic()) { ProjPeriodic(p_n_comp[lbase], pc_domain[lbase], geom[lbase].isPeriodic()); } - p_n[lbase].complementIn(pc_domain[lbase],p_n_comp[lbase]); + p_n[lbase].parallelComplementIn(pc_domain[lbase],p_n_comp[lbase]); p_n[lbase].simplify(); bl.clear(); @@ -530,7 +530,7 @@ AmrMesh::MakeNewGrids (int lbase, Real time, int& new_finest, Vector& ProjPeriodic(p_n_comp[i], pc_domain[i], geom[i].isPeriodic()); } - p_n[i].complementIn(pc_domain[i],p_n_comp[i]); + p_n[i].parallelComplementIn(pc_domain[i],p_n_comp[i]); p_n[i].simplify(); } @@ -550,12 +550,12 @@ AmrMesh::MakeNewGrids (int lbase, Real time, int& new_finest, Vector& if (levf < new_finest) { - BoxArray ba_proj(new_grids[levf+1]); + BoxArray ba_proj = new_grids[levf+1].simplified(); ba_proj.coarsen(ref_ratio[levf]); ba_proj.growcoarsen(n_proper, ref_ratio[levc]); - BoxArray levcBA = grids[levc]; + BoxArray levcBA = grids[levc].simplified(); while (!levcBA.contains(ba_proj)) { @@ -594,8 +594,7 @@ AmrMesh::MakeNewGrids (int lbase, Real time, int& new_finest, Vector& // Replace this by n_error_buf that may be anisotropic // int nerr = n_error_buf[levf]; - BoxList bl_tagged(new_grids[levf+1]); - bl_tagged.simplify(); + BoxList bl_tagged = new_grids[levf+1].simplified_list(); bl_tagged.coarsen(ref_ratio[levf]); // // This grows the boxes by n_error_buf[levf][idir] if they touch the edge @@ -617,7 +616,7 @@ AmrMesh::MakeNewGrids (int lbase, Real time, int& new_finest, Vector& } Box mboxF = amrex::grow(bl_tagged.minimalBox(),1); BoxList blFcomp; - blFcomp.complementIn(mboxF,bl_tagged); + blFcomp.parallelComplementIn(mboxF,bl_tagged); blFcomp.simplify(); bl_tagged.clear(); @@ -626,9 +625,8 @@ AmrMesh::MakeNewGrids (int lbase, Real time, int& new_finest, Vector& n_error_buf[levf][2]/ref_ratio[levf][2])); blFcomp.accrete(iv); BoxList blF; - blF.complementIn(mboxF,blFcomp); - BoxArray baF(blF); - blF.clear(); + 
blF.parallelComplementIn(mboxF,blFcomp); + BoxArray baF(std::move(blF)); baF.grow(n_proper); // // We need to do this in case the error buffering at @@ -682,10 +680,10 @@ AmrMesh::MakeNewGrids (int lbase, Real time, int& new_finest, Vector& // // Map tagged points through periodic boundaries, if any. // - tags.mapPeriodic(Geometry(pc_domain[levc], - Geom(levc).ProbDomain(), - Geom(levc).CoordInt(), - Geom(levc).isPeriodic())); + tags.mapPeriodicRemoveDuplicates(Geometry(pc_domain[levc], + Geom(levc).ProbDomain(), + Geom(levc).CoordInt(), + Geom(levc).isPeriodic())); // // Remove cells outside proper nesting domain for this level. // @@ -704,62 +702,68 @@ AmrMesh::MakeNewGrids (int lbase, Real time, int& new_finest, Vector& // if ( !(useFixedCoarseGrids() && levc0) { - if ( !(Geom(levc).Domain().contains(BoxArray(new_bx).minimalBox())) ) { - // Chop new grids outside domain, note that this is likely to result in - // new grids that violate blocking_factor....see warning checking below - new_bx = amrex::intersect(new_bx,Geom(levc).Domain()); - } - } - const IntVect& largest_grid_size = max_grid_size[levf] / ref_ratio[levc]; - // - // Ensure new grid boxes are at most max_grid_size in index dirs. - // - new_bx.maxSize(largest_grid_size); + if (levf > useFixedUpToLevel()) { + BoxList new_bx; + if (ParallelDescriptor::IOProcessor()) { + BL_PROFILE("AmrMesh-cluster"); + // + // Construct initial cluster. + // + ClusterList clist(&tagvec[0], tagvec.size()); + if (use_new_chop) { + clist.new_chop(grid_eff); + } else { + clist.chop(grid_eff); + } + BoxDomain bd; + bd.add(p_n[levc]); + clist.intersect(bd); + bd.clear(); + // + // Efficient properly nested Clusters have been constructed + // now generate list of grids at level levf. + // + clist.boxList(new_bx); + new_bx.refine(bf_lev[levc]); + new_bx.simplify(); + + if (new_bx.size()>0) { + // Chop new grids outside domain + new_bx.intersect(Geom(levc).Domain()); + } + } + new_bx.Bcast(); // Broadcast the new BoxList to other processes - // - // Refine up to levf. - // - new_bx.refine(ref_ratio[levc]); - BL_ASSERT(new_bx.isDisjoint()); + // + // Refine up to levf. + // + new_bx.refine(ref_ratio[levc]); + BL_ASSERT(new_bx.isDisjoint()); - if (new_bx.size()>0) { - if ( !(Geom(levf).Domain().contains(BoxArray(new_bx).minimalBox())) ) { - new_bx = amrex::intersect(new_bx,Geom(levf).Domain()); - } + new_grids[levf] = BoxArray(std::move(new_bx), max_grid_size[levf]); } + } + } - if(levf > useFixedUpToLevel()) { - new_grids[levf].define(new_bx); - } +#ifdef AMREX_DEBUG + if (!useFixedCoarseGrids()) { + // check proper nesting + for (int lev = lbase+1; lev <= new_finest; ++lev) { + BoxArray const& cba = (lev == lbase+1) ? 
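In the MakeNewGrids rewrite above, the expensive clustering now runs only on the I/O processor, and the resulting BoxList is then broadcast to the other ranks via new_bx.Bcast(). A minimal sketch of that owner-computes/broadcast pattern in raw MPI, with a plain integer vector standing in for the flattened BoxList (this is not BoxList::Bcast itself):

#include <mpi.h>
#include <vector>

std::vector<int> owner_computes_then_bcast (MPI_Comm comm)
{
    int rank;
    MPI_Comm_rank(comm, &rank);
    std::vector<int> payload;
    if (rank == 0) {
        payload = {1, 2, 3, 4};   // the expensive work happens on rank 0 only
    }
    int n = static_cast<int>(payload.size());
    MPI_Bcast(&n, 1, MPI_INT, 0, comm);               // first the size ...
    payload.resize(n);
    MPI_Bcast(payload.data(), n, MPI_INT, 0, comm);   // ... then the data
    return payload;
}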
grids[lev-1] : new_grids[lev-1]; + BoxArray const& fba = amrex::coarsen(new_grids[lev],ref_ratio[lev-1]); + IntVect np = bf_lev[lev-1] * n_proper; + Box const& cdomain = Geom(lev-1).Domain(); + for (int i = 0, N = fba.size(); i < N; ++i) { + Box const& fb = amrex::grow(fba[i],np) & cdomain; + if (!cba.contains(fb,true)) { + amrex::Abort("AmrMesh::MakeNewGrids: new grids not properly nested"); + } + } } } +#endif for (int lev = lbase+1; lev <= new_finest; ++lev) { if (new_grids[lev].empty()) @@ -788,10 +792,13 @@ AmrMesh::MakeNewGrids (Real time) const BoxArray& ba = MakeBaseGrids(); DistributionMapping dm(ba); const auto old_num_setdm = num_setdm; + const auto old_num_setba = num_setba; MakeNewLevelFromScratch(0, time, ba, dm); - SetBoxArray(0, ba); + if (old_num_setba == num_setba) { + SetBoxArray(0, ba); + } if (old_num_setdm == num_setdm) { SetDistributionMap(0, dm); } @@ -980,6 +987,22 @@ AmrMesh::checkInput () } } + // Make sure TagBoxArray has no overlapped valid cells after coarsening by block_factor/ref_ratio + for (int i = 0; i < max_level; ++i) { + for (int idim = 0; idim < AMREX_SPACEDIM; ++idim) { + int bf_lev = std::max(1,blocking_factor[i+1][idim]/ref_ratio[i][idim]); + int min_grid_size = std::min(blocking_factor[i][idim],max_grid_size[i][idim]); + if (min_grid_size % bf_lev != 0) { + amrex::Print() << "On level " << i << " in direction " << idim + << " max_grid_size is " << max_grid_size[i][idim] + << " blocking factor is " << blocking_factor[i][idim] << "\n" + << "On level " << i+1 << " in direction " << idim + << " blocking_factor is " << blocking_factor[i+1][idim] << std::endl; + amrex::Error("Coarse level blocking factor not a multiple of fine level blocking factor divided by ref ratio"); + } + } + } + if( ! (Geom(0).ProbDomain().volume() > 0.0) ) { amrex::Error("Amr::checkInput: bad physical problem size"); } diff --git a/Src/AmrCore/AMReX_AmrParGDB.H b/Src/AmrCore/AMReX_AmrParGDB.H index 1c189d45a95..2d7093a2bd5 100644 --- a/Src/AmrCore/AMReX_AmrParGDB.H +++ b/Src/AmrCore/AMReX_AmrParGDB.H @@ -13,25 +13,39 @@ public: explicit AmrParGDB (AmrCore* amr) noexcept : m_amrcore(amr), + m_geom(amr->maxLevel()+1), + m_has_geom(amr->maxLevel()+1, 0), m_dmap(amr->maxLevel()+1), m_ba(amr->maxLevel()+1) { } virtual ~AmrParGDB () {;} - - virtual const Geometry& Geom (int level) const override; - virtual const DistributionMapping& ParticleDistributionMap - (int level) const override; - virtual const DistributionMapping& DistributionMap - (int level) const override; + + virtual const Geometry& ParticleGeom (int level) const override; + virtual const Geometry& Geom (int level) const override; + + virtual const Vector& ParticleGeom () const override; + virtual const Vector& Geom () const override; + + virtual const DistributionMapping& ParticleDistributionMap (int level) const override; + virtual const DistributionMapping& DistributionMap (int level) const override; + + virtual const Vector& ParticleDistributionMap () const override; + virtual const Vector& DistributionMap () const override; + virtual const BoxArray& ParticleBoxArray (int level) const override; virtual const BoxArray& boxArray (int level) const override; + virtual const Vector& ParticleBoxArray () const override; + virtual const Vector& boxArray () const override; + virtual void SetParticleBoxArray (int level, const BoxArray& new_ba) override; virtual void SetParticleDistributionMap (int level, const DistributionMapping& new_dm) override; + virtual void SetParticleGeometry (int level, const Geometry& new_geom) 
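The new checkInput test above rejects parameter combinations in which the coarse level cannot be tiled compatibly with the next level's blocking factor once that factor is coarsened by the refinement ratio. A worked instance with made-up inputs:

#include <algorithm>
#include <cassert>

int main ()
{
    // Hypothetical inputs: coarse blocking_factor 4, fine blocking_factor 16,
    // ref_ratio 2, coarse max_grid_size 32.
    int bf_crse = 4, bf_fine = 16, ref = 2, mgs = 32;
    int bf_lev = std::max(1, bf_fine / ref);      // = 8
    int min_grid_size = std::min(bf_crse, mgs);   // = 4
    assert(min_grid_size % bf_lev != 0);          // 4 % 8 != 0: checkInput would abort
    return 0;
}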
override; virtual void ClearParticleBoxArray (int level) override; virtual void ClearParticleDistributionMap (int level) override; + virtual void ClearParticleGeometry (int level) override; virtual bool LevelDefined (int level) const override; virtual int finestLevel () const override; @@ -40,21 +54,55 @@ public: virtual IntVect refRatio (int level) const override; virtual int MaxRefRatio (int level) const override; + virtual Vector refRatio () const override; + protected: - AmrCore* m_amrcore; + + AmrCore* m_amrcore; + Vector m_geom; + Vector m_has_geom; Vector m_dmap; Vector m_ba; }; -inline -const Geometry& +inline +const Geometry& +AmrParGDB::ParticleGeom (int level) const +{ + if (not m_has_geom[level]) { + return m_amrcore->Geom(level); + } else { + return m_geom[level]; + } +} + +inline +const Geometry& AmrParGDB::Geom (int level) const { return m_amrcore->Geom(level); } -inline -const DistributionMapping& +inline +const Vector& +AmrParGDB::ParticleGeom () const +{ + if (not m_has_geom[0]) { + return m_amrcore->Geom(); + } else { + return m_geom; + } +} + +inline +const Vector& +AmrParGDB::Geom () const +{ + return m_amrcore->Geom(); +} + +inline +const DistributionMapping& AmrParGDB::ParticleDistributionMap (int level) const { if (m_dmap[level].empty()) { @@ -64,14 +112,32 @@ AmrParGDB::ParticleDistributionMap (int level) const } } -inline -const DistributionMapping& +inline +const DistributionMapping& AmrParGDB::DistributionMap (int level) const { return m_amrcore->DistributionMap(level); } -inline +inline +const Vector& +AmrParGDB::ParticleDistributionMap () const +{ + if (m_dmap[0].empty()) { + return m_amrcore->DistributionMap(); + } else { + return m_dmap; + } +} + +inline +const Vector& +AmrParGDB::DistributionMap () const +{ + return m_amrcore->DistributionMap(); +} + +inline const BoxArray& AmrParGDB::ParticleBoxArray (int level) const { @@ -89,6 +155,24 @@ AmrParGDB::boxArray (int level) const return m_amrcore->boxArray(level); } +inline +const Vector& +AmrParGDB::ParticleBoxArray () const +{ + if (m_ba[0].empty()) { + return m_amrcore->boxArray(); + } else { + return m_ba; + } +} + +inline +const Vector& +AmrParGDB::boxArray () const +{ + return m_amrcore->boxArray(); +} + inline void AmrParGDB::SetParticleBoxArray (int level, const BoxArray& new_ba) { @@ -101,6 +185,13 @@ void AmrParGDB::SetParticleDistributionMap (int level, const DistributionMapping m_dmap[level] = new_dmap; } +inline +void AmrParGDB::SetParticleGeometry (int level, const Geometry& new_geom) +{ + m_has_geom[level] = 1; + m_geom[level] = new_geom; +} + inline void AmrParGDB::ClearParticleBoxArray (int level) { @@ -113,36 +204,50 @@ void AmrParGDB::ClearParticleDistributionMap (int level) m_dmap[level] = DistributionMapping(); } -inline -bool +inline +void AmrParGDB::ClearParticleGeometry (int level) +{ + m_geom[level] = Geometry(); + m_has_geom[level] = 0; +} + +inline +bool AmrParGDB::LevelDefined (int level) const { return m_amrcore->LevelDefined(level); } -inline -int +inline +int AmrParGDB::finestLevel () const { return m_amrcore->finestLevel(); } -inline -int +inline +int AmrParGDB::maxLevel () const { return m_amrcore->maxLevel(); } - -inline -IntVect + +inline +IntVect AmrParGDB::refRatio (int level) const { return m_amrcore->refRatio(level); } -inline -int +inline +Vector +AmrParGDB::refRatio () const +{ + return m_amrcore->refRatio(); +} + +inline +int AmrParGDB::MaxRefRatio (int level) const { return m_amrcore->MaxRefRatio(level); diff --git a/Src/AmrCore/AMReX_Cluster.cpp 
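The AmrParGDB additions above all follow one pattern: a particle-specific override (Geometry, BoxArray, or DistributionMapping) is consulted first, and the accessor falls back to the AmrCore mesh data when no override has been set. A compact sketch of that pattern with invented names:

#include <cstddef>
#include <vector>

struct MeshData { std::vector<int> geom; };   // stand-in for the AmrCore side

class ParticleView
{
    MeshData* m_mesh;
    std::vector<int>  m_geom;       // per-level overrides
    std::vector<char> m_has_geom;   // 0 = fall back to mesh, 1 = use override
public:
    ParticleView (MeshData* mesh, std::size_t nlev)
        : m_mesh(mesh), m_geom(nlev), m_has_geom(nlev, 0) {}
    void set (int lev, int g) { m_geom[lev] = g; m_has_geom[lev] = 1; }
    void clear (int lev)      { m_geom[lev] = 0; m_has_geom[lev] = 0; }
    int  geom (int lev) const { return m_has_geom[lev] ? m_geom[lev] : m_mesh->geom[lev]; }
};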
b/Src/AmrCore/AMReX_Cluster.cpp index 10030d9995f..fb8bf807cb9 100644 --- a/Src/AmrCore/AMReX_Cluster.cpp +++ b/Src/AmrCore/AMReX_Cluster.cpp @@ -5,6 +5,7 @@ #include #include #include +#include namespace amrex { @@ -34,6 +35,8 @@ class InBox public: explicit InBox (const Box& b) noexcept : m_box(b) {} + // You might see a compiler warning that this is never referenced. + // The compiler is wrong. bool operator() (const IntVect& iv) const noexcept { return m_box.contains(iv); @@ -246,6 +249,8 @@ class Cut public: Cut (const IntVect& cut, int dir) : m_cut(cut), m_dir(dir) {} + // You might see a compiler warning that this is never referenced. + // The compiler is wrong. bool operator() (const IntVect& iv) const { return iv[m_dir] < m_cut[m_dir]; @@ -522,6 +527,7 @@ ClusterList::boxList (BoxList& blst) const void ClusterList::chop (Real eff) { + BL_PROFILE("ClusterList::chop()"); for (std::list::iterator cli = lst.begin(); cli != lst.end(); ) { @@ -539,6 +545,7 @@ ClusterList::chop (Real eff) void ClusterList::new_chop (Real eff) { + BL_PROFILE("ClusterList::new_chop()"); for (std::list::iterator cli = lst.begin(); cli != lst.end(); ) { @@ -556,6 +563,8 @@ ClusterList::new_chop (Real eff) void ClusterList::intersect (const BoxDomain& dom) { + BL_PROFILE("ClusterList::intersect()"); + // // Make a BoxArray covering dom. // We'll use this to speed up the contains() test below. diff --git a/Src/AmrCore/AMReX_ErrorList.H b/Src/AmrCore/AMReX_ErrorList.H index 9bdbea056bd..2beae107bb0 100644 --- a/Src/AmrCore/AMReX_ErrorList.H +++ b/Src/AmrCore/AMReX_ErrorList.H @@ -8,9 +8,13 @@ #include #include #include +#include +#include +#include namespace amrex { + extern "C" { @@ -372,6 +376,110 @@ private: std::ostream& operator << (std::ostream& os, const ErrorList& elst); + struct AMRErrorTagInfo + { + int m_max_level = 1000; + Real m_min_time = std::numeric_limits::lowest(); + Real m_max_time = std::numeric_limits::max(); + RealBox m_realbox; + + AMRErrorTagInfo& SetMaxLevel (int max_level) noexcept { + m_max_level = max_level; + return *this; + } + AMRErrorTagInfo& SetMinTime (amrex::Real min_time) noexcept { + m_min_time = min_time; + return *this; + } + AMRErrorTagInfo& SetMaxTime (amrex::Real max_time) noexcept { + m_max_time = max_time; + return *this; + } + AMRErrorTagInfo& SetRealBox (const amrex::RealBox& realbox) noexcept { + m_realbox = realbox; + return *this; + } + }; + + class AMRErrorTag + { + public: + + enum TEST {GRAD=0, LESS, GREATER, VORT, BOX, USER}; + + struct UserFunc + { + virtual void operator() (const amrex::Box& bx, + amrex::Array4 const& dat, + amrex::Array4 const& tag, + amrex::Real time, + int level, + char tagval, + char clearval) = 0; + }; + + explicit AMRErrorTag (const AMRErrorTagInfo& info = AMRErrorTagInfo()) noexcept + : m_test(BOX), m_field(std::string()), m_info(info) {m_ngrow = SetNGrow();} + + AMRErrorTag (amrex::Real value, + AMRErrorTag::TEST test, + const std::string& field, + const AMRErrorTagInfo& info = AMRErrorTagInfo()) noexcept + : m_test(test), m_field(field), m_info(info) + { + m_value.resize(info.m_max_level); + for (int i = 0; i < m_value.size(); ++i) { + m_value[i] = value; + } + m_ngrow = SetNGrow(); + } + + AMRErrorTag (amrex::Vector value, + AMRErrorTag::TEST test, + const std::string& field, + const AMRErrorTagInfo& info = AMRErrorTagInfo()) noexcept + : m_test(test), m_field(field), m_info(info) + { + AMREX_ASSERT(value.size() > 0); + m_value.resize(info.m_max_level); + for (int i = 0; i < m_value.size() && i < value.size(); ++i) { + m_value[i] =
value[i]; } + // If the user didn't provide a value for every level, + // assume the last value holds for all higher levels. + for (int i = value.size(); i < m_value.size(); ++i) { + m_value[i] = value[value.size()-1]; + } + m_ngrow = SetNGrow(); + } + + AMRErrorTag (AMRErrorTag::UserFunc* userfunc, + const std::string& field, + int ngrow, + const AMRErrorTagInfo& info = AMRErrorTagInfo()) noexcept + : m_userfunc(userfunc), m_field(field), m_info(info), m_ngrow(ngrow) {} + + virtual void operator() (amrex::TagBoxArray& tb, + const amrex::MultiFab* mf, + char clearval, + char tagval, + amrex::Real time, + int level, + const amrex::Geometry& geom) const noexcept; + + int NGrow() const noexcept {return m_ngrow;} + const std::string& Field () const noexcept {return m_field;} + + protected: + int SetNGrow () const noexcept; + + Vector m_value; + TEST m_test; + UserFunc* m_userfunc = nullptr; + std::string m_field; + AMRErrorTagInfo m_info; + int m_ngrow; + }; } #endif diff --git a/Src/AmrCore/AMReX_ErrorList.cpp b/Src/AmrCore/AMReX_ErrorList.cpp index a41bc1a199f..ae1e1543faf 100644 --- a/Src/AmrCore/AMReX_ErrorList.cpp +++ b/Src/AmrCore/AMReX_ErrorList.cpp @@ -228,4 +228,194 @@ operator << (std::ostream& os, return os; } + static + void + AMRErrorTag_GRAD(const Box& bx, + Array4 const& dat, + Array4 const& tag, + Real threshold, + char tagval) + { + amrex::ParallelFor(bx, + [=] AMREX_GPU_HOST_DEVICE (int i, int j, int k) noexcept + { + auto ax = amrex::Math::abs(dat(i+1,j,k) - dat(i,j,k)); + ax = amrex::max(ax,amrex::Math::abs(dat(i,j,k) - dat(i-1,j,k))); +#if AMREX_SPACEDIM == 1 + if (ax >= threshold) tag(i,j,k) = tagval; +#else + auto ay = amrex::Math::abs(dat(i,j+1,k) - dat(i,j,k)); + ay = amrex::max(ay,amrex::Math::abs(dat(i,j,k) - dat(i,j-1,k))); +#if AMREX_SPACEDIM > 2 + auto az = amrex::Math::abs(dat(i,j,k+1) - dat(i,j,k)); + az = amrex::max(az,amrex::Math::abs(dat(i,j,k) - dat(i,j,k-1))); +#endif + if (amrex::max(AMREX_D_DECL(ax,ay,az)) >= threshold) { + tag(i,j,k) = tagval; + } +#endif + }); + } + + int + AMRErrorTag::SetNGrow () const noexcept + { + AMREX_ALWAYS_ASSERT_WITH_MESSAGE(m_test != USER, "Do not call SetNGrow with USER test"); + static std::map ng = { {GRAD,1}, {LESS,0}, {GREATER,0}, {VORT,0}, {BOX,0} }; + return ng[m_test]; + } + + static + void + AMRErrorTag_LESS(const Box& bx, + Array4 const& dat, + Array4 const& tag, + Real threshold, + char tagval) noexcept + { + amrex::ParallelFor(bx, + [=] AMREX_GPU_HOST_DEVICE (int i, int j, int k) noexcept + { + if (dat(i,j,k) <= threshold) { + tag(i,j,k) = tagval; + } + }); + } + + static + void + AMRErrorTag_GREATER(const Box& bx, + Array4 const& dat, + Array4 const& tag, + Real threshold, + char tagval) noexcept + { + amrex::ParallelFor(bx, + [=] AMREX_GPU_HOST_DEVICE (int i, int j, int k) noexcept + { + if (dat(i,j,k) >= threshold) { + tag(i,j,k) = tagval; + } + }); + } + + static + void + AMRErrorTag_BOX(const Box& bx, + Array4 const& tag, + const RealBox& tag_rb, + const Geometry& geom, + char tagval) noexcept + { + auto plo = geom.ProbLoArray(); + auto dx = geom.CellSizeArray(); + class RealBox trb(bx,dx.data(),plo.data()); + if (tag_rb.intersects(trb)) + { + amrex::ParallelFor(bx, + [=] AMREX_GPU_HOST_DEVICE (int i, int j, int k) noexcept + { + GpuArray pt = {{AMREX_D_DECL(plo[0]+(Real(i)+Real(0.5))*dx[0], + plo[1]+(Real(j)+Real(0.5))*dx[1], + plo[2]+(Real(k)+Real(0.5))*dx[2])}}; + if (tag_rb.contains(pt.data())) { + tag(i,j,k) = tagval; + } + }); + } + } + + static + void + AMRErrorTag_VORT(const Box& bx, + Array4
const& dat, + Array4 const& tag, + int level, + Real threshold, + char tagval) noexcept + { + const Real fac = threshold * std::pow(2,level); + amrex::ParallelFor(bx, + [=] AMREX_GPU_HOST_DEVICE (int i, int j, int k) noexcept + { + if (dat(i,j,k) >= fac) { + tag(i,j,k) = tagval; + } + }); + } + + void + AMRErrorTag::operator() (TagBoxArray& tba, + const MultiFab* mf, + char clearval, + char tagval, + Real time, + int level, + const Geometry& geom) const noexcept + { + BL_PROFILE("AMRErrorTag::operator()"); + + if (m_test == USER) + { + AMREX_ALWAYS_ASSERT_WITH_MESSAGE(m_userfunc!=nullptr,"UserFunc not properly set in AMRErrorTag"); + +#ifdef _OPENMP +#pragma omp parallel if (Gpu::notInLaunchRegion()) +#endif + for (MFIter mfi(tba,TilingIfNotGPU()); mfi.isValid(); ++mfi) + { + const auto& bx = mfi.tilebox(); + auto const& dat = mf->array(mfi); + auto tag = tba.array(mfi); + (*m_userfunc)(bx,dat,tag,time,level,tagval,clearval); + } + } + else + { + if ((level < m_info.m_max_level) && + (time >= m_info.m_min_time ) && + (time <= m_info.m_max_time ) ) + { + +#ifdef _OPENMP +#pragma omp parallel if (Gpu::notInLaunchRegion()) +#endif + for (MFIter mfi(tba,TilingIfNotGPU()); mfi.isValid(); ++mfi) + { + const auto& bx = mfi.tilebox(); + auto tag = tba.array(mfi); + + if (m_test == BOX) + { + AMRErrorTag_BOX(bx, tag, m_info.m_realbox, geom, tagval); + } + else + { + auto const& dat = mf->array(mfi); + + if (m_test == GRAD) + { + AMRErrorTag_GRAD(bx, dat, tag, m_value[level], tagval); + } + else if (m_test == LESS) + { + AMRErrorTag_LESS(bx, dat, tag, m_value[level], tagval); + } + else if (m_test == GREATER) + { + AMRErrorTag_GREATER(bx, dat, tag, m_value[level], tagval); + } + else if (m_test == VORT) + { + AMRErrorTag_VORT(bx, dat, tag, level, m_value[level], tagval); + } + else + { + Abort("Bad AMRErrorTag test flag"); + } + } + } + } + } + } } diff --git a/Src/AmrCore/AMReX_FillPatchUtil.H b/Src/AmrCore/AMReX_FillPatchUtil.H index ccb3c47f213..751c5369f3d 100644 --- a/Src/AmrCore/AMReX_FillPatchUtil.H +++ b/Src/AmrCore/AMReX_FillPatchUtil.H @@ -26,7 +26,7 @@ namespace amrex template struct NullInterpHook { - void operator() (FAB& fab, const Box& bx, int icomp, int ncomp) const {} + void operator() (FAB& /*fab*/, const Box& /*bx*/, int /*icomp*/, int /*ncomp*/) const {} }; template diff --git a/Src/AmrCore/AMReX_FillPatchUtil.cpp b/Src/AmrCore/AMReX_FillPatchUtil.cpp index 688353b2946..0dd68cb8955 100644 --- a/Src/AmrCore/AMReX_FillPatchUtil.cpp +++ b/Src/AmrCore/AMReX_FillPatchUtil.cpp @@ -15,8 +15,8 @@ namespace amrex int ref_ratio) { InterpCrseFineBndryEMfield(interp_type, - {AMREX_D_DECL(&crse[0],&crse[1],&crse[2])}, - {AMREX_D_DECL(&fine[0],&fine[1],&fine[2])}, + {{AMREX_D_DECL(&crse[0],&crse[1],&crse[2])}}, + {{AMREX_D_DECL(&fine[0],&fine[1],&fine[2])}}, cgeom, fgeom, ref_ratio); } diff --git a/Src/AmrCore/AMReX_FillPatchUtil_I.H b/Src/AmrCore/AMReX_FillPatchUtil_I.H index e841643b401..4dad3b9965f 100644 --- a/Src/AmrCore/AMReX_FillPatchUtil_I.H +++ b/Src/AmrCore/AMReX_FillPatchUtil_I.H @@ -164,34 +164,54 @@ namespace { int>::type = 0> MF make_mf_crse_patch (FabArrayBase::FPinfo const& fpc, int ncomp) { - MF mf_crse_patch(fpc.ba_crse_patch, fpc.dm_crse_patch, ncomp, 0, MFInfo(), + MF mf_crse_patch(fpc.ba_crse_patch, fpc.dm_patch, ncomp, 0, MFInfo(), *fpc.fact_crse_patch); return mf_crse_patch; } + template ::value, + int>::type = 0> + MF make_mf_fine_patch (FabArrayBase::FPinfo const& fpc, int ncomp) + { + MF mf_fine_patch(fpc.ba_fine_patch, fpc.dm_patch, ncomp, 0, MFInfo(), + 
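A usage sketch for the AMRErrorTag machinery defined above. The field name, threshold, and box are invented for illustration; the call at the end follows the operator() signature declared in AMReX_ErrorList.H:

// Tag cells where a (hypothetical) "density" field exceeds 2.0, but only
// below level 3 and inside a sub-box of the domain.
AMRErrorTagInfo info;
info.SetMaxLevel(3)
    .SetRealBox(RealBox(AMREX_D_DECL(0.0, 0.0, 0.0),
                        AMREX_D_DECL(0.5, 0.5, 0.5)));
AMRErrorTag err_tag(2.0, AMRErrorTag::GREATER, "density", info);

// Later, e.g. from an ErrorEst() implementation, with mf holding the field:
//   err_tag(tags, &mf, TagBox::CLEAR, TagBox::SET, time, level, geom);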
*fpc.fact_fine_patch); + return mf_fine_patch; + } + template ::value, int>::type = 0> MF make_mf_crse_patch (FabArrayBase::FPinfo const& fpc, int ncomp) { - return MF(fpc.ba_crse_patch, fpc.dm_crse_patch, ncomp, 0); + return MF(fpc.ba_crse_patch, fpc.dm_patch, ncomp, 0); + } + + template ::value, + int>::type = 0> + MF make_mf_fine_patch (FabArrayBase::FPinfo const& fpc, int ncomp) + { + return MF(fpc.ba_fine_patch, fpc.dm_patch, ncomp, 0); } template ::value, int>::type = 0> - void mf_set_domain_bndry (MF &mf, Geometry const & cgeom) + void mf_set_domain_bndry (MF &mf, Geometry const & geom) { - mf.setDomainBndry(std::numeric_limits::quiet_NaN(), cgeom); + mf.setDomainBndry(std::numeric_limits::quiet_NaN(), geom); } template ::value, int>::type = 0> - void mf_set_domain_bndry (MF &mf, Geometry const & cgeom) + void mf_set_domain_bndry (MF &/*mf*/, Geometry const & /*geom*/) { // nothing } @@ -199,88 +219,73 @@ namespace { template EnableIf_t::value> FillPatchTwoLevels_doit (MF& mf, IntVect const& nghost, Real time, - const Vector& cmf, const Vector& ct, - const Vector& fmf, const Vector& ft, - int scomp, int dcomp, int ncomp, - const Geometry& cgeom, const Geometry& fgeom, - BC& cbc, int cbccomp, + const Vector& cmf, const Vector& ct, + const Vector& fmf, const Vector& ft, + int scomp, int dcomp, int ncomp, + const Geometry& cgeom, const Geometry& fgeom, + BC& cbc, int cbccomp, BC& fbc, int fbccomp, - const IntVect& ratio, - Interp* mapper, + const IntVect& ratio, + Interp* mapper, const Vector& bcs, int bcscomp, const PreInterpHook& pre_interp, const PostInterpHook& post_interp, EB2::IndexSpace const* index_space) { - BL_PROFILE("FillPatchTwoLevels"); + BL_PROFILE("FillPatchTwoLevels"); using FAB = typename MF::FABType::value_type; - if (nghost.max() > 0 || mf.getBDKey() != fmf[0]->getBDKey()) - { - const InterpolaterBoxCoarsener& coarsener = mapper->BoxCoarsener(ratio); - - Box fdomain = fgeom.Domain(); - fdomain.convert(mf.boxArray().ixType()); - Box fdomain_g(fdomain); - for (int i = 0; i < AMREX_SPACEDIM; ++i) { - if (fgeom.isPeriodic(i)) { - fdomain_g.grow(i,nghost[i]); - } - } + if (nghost.max() > 0 || mf.getBDKey() != fmf[0]->getBDKey()) + { + const InterpolaterBoxCoarsener& coarsener = mapper->BoxCoarsener(ratio); - const FabArrayBase::FPinfo& fpc = FabArrayBase::TheFPinfo(*fmf[0], mf, fdomain_g, + const FabArrayBase::FPinfo& fpc = FabArrayBase::TheFPinfo(*fmf[0], mf, nghost, coarsener, - amrex::coarsen(fgeom.Domain(),ratio), + fgeom, + cgeom, index_space); - if ( ! fpc.ba_crse_patch.empty()) - { + if ( ! 
fpc.ba_crse_patch.empty()) + { MF mf_crse_patch = make_mf_crse_patch(fpc, ncomp); mf_set_domain_bndry (mf_crse_patch, cgeom); - FillPatchSingleLevel(mf_crse_patch, time, cmf, ct, scomp, 0, ncomp, cgeom, cbc, cbccomp); + FillPatchSingleLevel(mf_crse_patch, time, cmf, ct, scomp, 0, ncomp, cgeom, cbc, cbccomp); + + MF mf_fine_patch = make_mf_fine_patch(fpc, ncomp); - int idummy1=0, idummy2=0; - bool cc = fpc.ba_crse_patch.ixType().cellCentered(); - ignore_unused(cc); + Box const& fdomain = amrex::convert(fgeom.Domain(),mf.ixType()); + int idummy=0; #ifdef _OPENMP + bool cc = fpc.ba_crse_patch.ixType().cellCentered(); #pragma omp parallel if (cc && Gpu::notInLaunchRegion()) #endif { Vector bcr(ncomp); - for (MFIter mfi(mf_crse_patch); mfi.isValid(); ++mfi) + for (MFIter mfi(mf_fine_patch); mfi.isValid(); ++mfi) { FAB& sfab = mf_crse_patch[mfi]; - int li = mfi.LocalIndex(); - int gi = fpc.dst_idxs[li]; - FAB& dfab = mf[gi]; - const Box& dbx = fpc.dst_boxes[li] & dfab.box(); + FAB& dfab = mf_fine_patch[mfi]; + const Box& dbx = dfab.box(); amrex::setBC(dbx,fdomain,bcscomp,0,ncomp,bcs,bcr); pre_interp(sfab, sfab.box(), 0, ncomp); - mapper->interp(sfab, - 0, - dfab, - dcomp, - ncomp, - dbx, - ratio, - cgeom, - fgeom, - bcr, - idummy1, idummy2, RunOn::Gpu); - - post_interp(dfab, dbx, dcomp, ncomp); + mapper->interp(sfab, 0, dfab, 0, ncomp, dbx, ratio, + cgeom, fgeom, bcr, dcomp, idummy, RunOn::Gpu); + + post_interp(dfab, dbx, 0, ncomp); } } + + mf.ParallelCopy(mf_fine_patch, 0, dcomp, ncomp, IntVect{0}, nghost); } } - FillPatchSingleLevel(mf, nghost, time, fmf, ft, scomp, dcomp, ncomp, + FillPatchSingleLevel(mf, nghost, time, fmf, ft, scomp, dcomp, ncomp, fgeom, fbc, fbccomp); } } @@ -445,12 +450,16 @@ InterpFromCoarseLevel (MF& mf, IntVect const& nghost, Real time, } } + MF mf_crse_patch; #ifdef AMREX_USE_EB - auto factory = makeEBFabFactory(cgeom, ba_crse_patch, dm, {0,0,0}, EBSupport::basic); - MF mf_crse_patch(ba_crse_patch, dm, ncomp, 0, MFInfo(), *factory); -#else - MF mf_crse_patch(ba_crse_patch, dm, ncomp, 0); + if (EB2::TopIndexSpaceIfPresent()) { + auto factory = makeEBFabFactory(cgeom, ba_crse_patch, dm, {0,0,0}, EBSupport::basic); + mf_crse_patch.define(ba_crse_patch, dm, ncomp, 0, MFInfo(), *factory); + } else #endif + { + mf_crse_patch.define(ba_crse_patch, dm, ncomp, 0); + } mf_set_domain_bndry (mf_crse_patch, cgeom); mf_crse_patch.copy(cmf, scomp, 0, ncomp, cgeom.periodicity()); diff --git a/Src/AmrCore/AMReX_FluxRegister.cpp b/Src/AmrCore/AMReX_FluxRegister.cpp index af6053878dd..5156db8b1dd 100644 --- a/Src/AmrCore/AMReX_FluxRegister.cpp +++ b/Src/AmrCore/AMReX_FluxRegister.cpp @@ -455,7 +455,7 @@ FluxRegister::FineSetVal (int dir, int destcomp, int numcomp, Real val, - RunOn runon) noexcept + RunOn /*runon*/) noexcept { Gpu::LaunchSafeGuard lsg(false); // xxxxx gpu todo diff --git a/Src/AmrCore/AMReX_Interp_1D_C.H b/Src/AmrCore/AMReX_Interp_1D_C.H index 21420e79715..5ba215ace6d 100644 --- a/Src/AmrCore/AMReX_Interp_1D_C.H +++ b/Src/AmrCore/AMReX_Interp_1D_C.H @@ -33,8 +33,8 @@ ccinterp_compute_voff (Box const& cbx, IntVect const& ratio, Geometry const& cge const int ic = amrex::coarsen(i, ratio[0]); const int ii = i - flo.x; const int iic = ic - clo.x; - const Real fcen = 0.5_rt*(fvc[ii ]+fvc[ii +1]); - const Real ccen = 0.5_rt*(cvc[iic]+cvc[iic+1]); + const Real fcen = Real(0.5)*(fvc[ii ]+fvc[ii +1]); + const Real ccen = Real(0.5)*(cvc[iic]+cvc[iic+1]); xoff[ii] = (fcen-ccen)/(cvc[iic+1]-cvc[iic]); } @@ -51,17 +51,17 @@ compute_slopes (const Dim3& lo, const Dim3& hi, { 
AMREX_PRAGMA_SIMD for (int i = lo.x; i <= hi.x; ++i) { - slopes(i,0,0,ns) = 0.5_rt*(u(i+1,0,0,nu)-u(i-1,0,0,nu)); + slopes(i,0,0,ns) = Real(0.5)*(u(i+1,0,0,nu)-u(i-1,0,0,nu)); } if (lo.x == slo.x && (bc.lo(0) == BCType::ext_dir || bc.lo(0) == BCType::hoextrap)) { const int i = slo.x; if (shi.x-slo.x >= 1) { - slopes(i,0,0,ns) = -(16._rt/15._rt)*u(i-1,0,0,nu) + 0.5_rt*u(i,0,0,nu) - + (2._rt/3._rt)*u(i+1,0,0,nu) - 0.1_rt*u(i+2,0,0,nu); + slopes(i,0,0,ns) = -Real(16./15.)*u(i-1,0,0,nu) + Real(0.5)*u(i,0,0,nu) + + Real(2./3.)*u(i+1,0,0,nu) - Real(0.1)*u(i+2,0,0,nu); } else { - slopes(i,0,0,ns) = 0.25_rt*(u(i+1,0,0,nu)+5._rt*u(i,0,0,nu)-6._rt*u(i-1,0,0,nu)); + slopes(i,0,0,ns) = Real(0.25)*(u(i+1,0,0,nu)+Real(5.)*u(i,0,0,nu)-Real(6.)*u(i-1,0,0,nu)); } } @@ -69,10 +69,10 @@ compute_slopes (const Dim3& lo, const Dim3& hi, { const int i = shi.x; if (shi.x-slo.x >= 1) { - slopes(i,0,0,ns) = (16._rt/15._rt)*u(i+1,0,0,nu) - 0.5_rt*u(i,0,0,nu) - - (2._rt/3._rt)*u(i-1,0,0,nu) + 0.1_rt*u(i-2,0,0,nu); + slopes(i,0,0,ns) = Real(16./15.)*u(i+1,0,0,nu) - Real(0.5)*u(i,0,0,nu) + - Real(2./3.)*u(i-1,0,0,nu) + Real(0.1)*u(i-2,0,0,nu); } else { - slopes(i,0,0,ns) = -0.25_rt*(u(i-1,0,0,nu)+5._rt*u(i,0,0,nu)-6._rt*u(i+1,0,0,nu)); + slopes(i,0,0,ns) = -Real(0.25)*(u(i-1,0,0,nu)+Real(5.)*u(i,0,0,nu)-Real(6.)*u(i+1,0,0,nu)); } } } @@ -94,7 +94,7 @@ cellconslin_slopes_linlim (Box const& bx, Array4 const& slopes, AMREX_PRAGMA_SIMD for (int i = lo.x; i <= hi.x; ++i) { - sf(i,0,0) = 1.0_rt; + sf(i,0,0) = Real(1.); } for (int n = 0; n < ncomp; ++n) @@ -105,14 +105,14 @@ cellconslin_slopes_linlim (Box const& bx, Array4 const& slopes, AMREX_PRAGMA_SIMD for (int i = lo.x; i <= hi.x; ++i) { Real cen = slopes(i,0,0,n); - Real forw = 2.0_rt*(u(i+1,0,0,nu)-u(i ,0,0,nu)); - Real back = 2.0_rt*(u(i ,0,0,nu)-u(i-1,0,0,nu)); - Real slp = (forw*back >= 0.0_rt) ? amrex::min(amrex::Math::abs(forw),amrex::Math::abs(back)) : 0.0_rt; - slopes(i,0,0,n) = amrex::Math::copysign(1.0_rt,cen)*amrex::min(slp,amrex::Math::abs(cen)); - if (cen != 0.0_rt) { + Real forw = Real(2.)*(u(i+1,0,0,nu)-u(i ,0,0,nu)); + Real back = Real(2.)*(u(i ,0,0,nu)-u(i-1,0,0,nu)); + Real slp = (forw*back >= Real(0.)) ? amrex::min(amrex::Math::abs(forw),amrex::Math::abs(back)) : Real(0.); + slopes(i,0,0,n) = amrex::Math::copysign(Real(1.),cen)*amrex::min(slp,amrex::Math::abs(cen)); + if (cen != Real(0.)) { sf(i,0,0) = amrex::min(sf(i,0,0), slopes(i,0,0,n)/cen); } else { - sf(i,0,0) = 0.0_rt; + sf(i,0,0) = Real(0.); } } } @@ -181,10 +181,10 @@ cellconslin_slopes_mclim (Box const& bx, Array4 const& slopes, AMREX_PRAGMA_SIMD for (int i = lo.x; i <= hi.x; ++i) { Real cen = slopes(i,0,0,n); - Real forw = 2.0_rt*(u(i+1,0,0,nu)-u(i ,0,0,nu)); - Real back = 2.0_rt*(u(i ,0,0,nu)-u(i-1,0,0,nu)); - Real slp = (forw*back >= 0.0_rt) ? amrex::min(amrex::Math::abs(forw),amrex::Math::abs(back)) : 0.0_rt; - slopes(i,0,0,n) = amrex::Math::copysign(1.0_rt,cen)*amrex::min(slp,amrex::Math::abs(cen)); + Real forw = Real(2.)*(u(i+1,0,0,nu)-u(i ,0,0,nu)); + Real back = Real(2.)*(u(i ,0,0,nu)-u(i-1,0,0,nu)); + Real slp = (forw*back >= Real(0.)) ? 
amrex::min(amrex::Math::abs(forw),amrex::Math::abs(back)) : Real(0.); + slopes(i,0,0,n) = amrex::Math::copysign(Real(1.),cen)*amrex::min(slp,amrex::Math::abs(cen)); } } } @@ -208,12 +208,12 @@ cellconslin_fine_alpha (Box const& bx, Array4 const& alpha, const int ic = amrex::coarsen(i,ratio[0]); const Real dummy_fine = xoff[i-vlo.x]*slopes(ic,0,0,n); - if (dummy_fine > mm(ic,0,0,n+ncomp) && dummy_fine != 0.0_rt) { + if (dummy_fine > mm(ic,0,0,n+ncomp) && dummy_fine != Real(0.)) { alpha(i,0,0,n) = mm(ic,0,0,n+ncomp) / dummy_fine; - } else if (dummy_fine < mm(ic,0,0,n) && dummy_fine != 0.0_rt) { + } else if (dummy_fine < mm(ic,0,0,n) && dummy_fine != Real(0.)) { alpha(i,0,0,n) = mm(ic,0,0,n) / dummy_fine; } else { - alpha(i,0,0,n) = 1.0_rt; + alpha(i,0,0,n) = Real(1.); } } } @@ -230,7 +230,7 @@ cellconslin_slopes_mmlim (Box const& bx, Array4 const& slopes, for (int n = 0; n < ncomp; ++n) { for (int i = lo.x; i <= hi.x; ++i) { const int ii = i*ratio[0]; - Real a = 1.0_rt; + Real a = Real(1.); for (int ioff = 0; ioff < ratio[0]; ++ioff) { a = amrex::min(a, alpha(ii+ioff,0,0,n)); } @@ -265,7 +265,7 @@ nodebilin_slopes (Box const& bx, Array4 const& slope, Array4 const& const auto lo = amrex::lbound(bx); const auto hi = amrex::ubound(bx); - const Real rx = 1.0_rt/ratio[0]; + const Real rx = Real(1.)/ratio[0]; for (int n = 0; n < ncomp; ++n) { AMREX_PRAGMA_SIMD @@ -296,6 +296,16 @@ nodebilin_interp (Box const& bx, Array4 const& fine, const int fcomp, const i } } +template +AMREX_GPU_HOST_DEVICE AMREX_FORCE_INLINE void +face_linear_interp_x (int i, int /*j*/, int /*k*/, int n, Array4 const& fine, + Array4 const& crse, IntVect const& ratio) noexcept +{ + int ii = amrex::coarsen(i,ratio[0]); + Real const w = static_cast(i-ii*ratio[0]) * (Real(1.)/ratio[0]); + fine(i,0,0,n) = (Real(1.)-w) * crse(ii,0,0,n) + w * crse(ii+1,0,0,n); +} + } #endif diff --git a/Src/AmrCore/AMReX_Interp_2D_C.H b/Src/AmrCore/AMReX_Interp_2D_C.H index 7d8396aa01e..57eabbb749a 100644 --- a/Src/AmrCore/AMReX_Interp_2D_C.H +++ b/Src/AmrCore/AMReX_Interp_2D_C.H @@ -33,8 +33,8 @@ ccinterp_compute_voff (Box const& cbx, IntVect const& ratio, Geometry const& cge const int ic = amrex::coarsen(i, ratio[0]); const int ii = i - flo.x; const int iic = ic - clo.x; - const Real fcen = 0.5_rt*(fvc[ii ]+fvc[ii +1]); - const Real ccen = 0.5_rt*(cvc[iic]+cvc[iic+1]); + const Real fcen = Real(0.5)*(fvc[ii ]+fvc[ii +1]); + const Real ccen = Real(0.5)*(cvc[iic]+cvc[iic+1]); xoff[ii] = (fcen-ccen)/(cvc[iic+1]-cvc[iic]); } @@ -47,8 +47,8 @@ ccinterp_compute_voff (Box const& cbx, IntVect const& ratio, Geometry const& cge const int jc = amrex::coarsen(j, ratio[1]); const int jj = j - flo.y; const int jjc = jc - clo.y; - const Real fcen = 0.5_rt*(fvc[jj ]+fvc[jj +1]); - const Real ccen = 0.5_rt*(cvc[jjc]+cvc[jjc+1]); + const Real fcen = Real(0.5)*(fvc[jj ]+fvc[jj +1]); + const Real ccen = Real(0.5)*(cvc[jjc]+cvc[jjc+1]); yoff[jj] = (fcen-ccen)/(cvc[jjc+1]-cvc[jjc]); } @@ -66,8 +66,8 @@ compute_slopes (const Dim3& lo, const Dim3& hi, for (int j = lo.y; j <= hi.y; ++j) { AMREX_PRAGMA_SIMD for (int i = lo.x; i <= hi.x; ++i) { - slopes(i,j,0,ns ) = 0.5_rt*(u(i+1,j,0,nu)-u(i-1,j,0,nu)); - slopes(i,j,0,ns+ncomp) = 0.5_rt*(u(i,j+1,0,nu)-u(i,j-1,0,nu)); + slopes(i,j,0,ns ) = Real(0.5)*(u(i+1,j,0,nu)-u(i-1,j,0,nu)); + slopes(i,j,0,ns+ncomp) = Real(0.5)*(u(i,j+1,0,nu)-u(i,j-1,0,nu)); } } @@ -76,12 +76,12 @@ compute_slopes (const Dim3& lo, const Dim3& hi, const int i = slo.x; if (shi.x-slo.x >= 1) { for (int j = lo.y; j <= hi.y; ++j) { - slopes(i,j,0,ns) = 
-(16._rt/15._rt)*u(i-1,j,0,nu) + 0.5_rt*u(i,j,0,nu) - + (2._rt/3._rt)*u(i+1,j,0,nu) - 0.1_rt*u(i+2,j,0,nu); + slopes(i,j,0,ns) = -Real(16./15.)*u(i-1,j,0,nu) + Real(0.5)*u(i,j,0,nu) + + Real(2./3.)*u(i+1,j,0,nu) - Real(0.1)*u(i+2,j,0,nu); } } else { for (int j = lo.y; j <= hi.y; ++j) { - slopes(i,j,0,ns) = 0.25_rt*(u(i+1,j,0,nu)+5._rt*u(i,j,0,nu)-6._rt*u(i-1,j,0,nu)); + slopes(i,j,0,ns) = Real(0.25)*(u(i+1,j,0,nu)+Real(5.)*u(i,j,0,nu)-Real(6.)*u(i-1,j,0,nu)); } } } @@ -91,12 +91,12 @@ compute_slopes (const Dim3& lo, const Dim3& hi, const int i = shi.x; if (shi.x-slo.x >= 1) { for (int j = lo.y; j <= hi.y; ++j) { - slopes(i,j,0,ns) = (16._rt/15._rt)*u(i+1,j,0,nu) - 0.5_rt*u(i,j,0,nu) - - (2._rt/3._rt)*u(i-1,j,0,nu) + 0.1_rt*u(i-2,j,0,nu); + slopes(i,j,0,ns) = Real(16./15.)*u(i+1,j,0,nu) - Real(0.5)*u(i,j,0,nu) + - Real(2./3.)*u(i-1,j,0,nu) + Real(0.1)*u(i-2,j,0,nu); } } else { for (int j = lo.y; j <= hi.y; ++j) { - slopes(i,j,0,ns) = -0.25_rt*(u(i-1,j,0,nu)+5._rt*u(i,j,0,nu)-6._rt*u(i+1,j,0,nu)); + slopes(i,j,0,ns) = -Real(0.25)*(u(i-1,j,0,nu)+Real(5.)*u(i,j,0,nu)-Real(6.)*u(i+1,j,0,nu)); } } } @@ -107,13 +107,13 @@ compute_slopes (const Dim3& lo, const Dim3& hi, if (shi.y-slo.y >= 1) { AMREX_PRAGMA_SIMD for (int i = lo.x; i <= hi.x; ++i) { - slopes(i,j,0,ns+ncomp) = -(16._rt/15._rt)*u(i,j-1,0,nu) + 0.5_rt*u(i,j,0,nu) - + (2._rt/3._rt)*u(i,j+1,0,nu) - 0.1_rt*u(i,j+2,0,nu); + slopes(i,j,0,ns+ncomp) = -Real(16./15.)*u(i,j-1,0,nu) + Real(0.5)*u(i,j,0,nu) + + Real(2./3.)*u(i,j+1,0,nu) - Real(0.1)*u(i,j+2,0,nu); } } else { AMREX_PRAGMA_SIMD for (int i = lo.x; i <= hi.x; ++i) { - slopes(i,j,0,ns+ncomp) = 0.25_rt*(u(i,j+1,0,nu)+5._rt*u(i,j,0,nu)-6._rt*u(i,j-1,0,nu)); + slopes(i,j,0,ns+ncomp) = Real(0.25)*(u(i,j+1,0,nu)+Real(5.)*u(i,j,0,nu)-Real(6.)*u(i,j-1,0,nu)); } } } @@ -124,13 +124,13 @@ compute_slopes (const Dim3& lo, const Dim3& hi, if (shi.y-slo.y >= 1) { AMREX_PRAGMA_SIMD for (int i = lo.x; i <= hi.x; ++i) { - slopes(i,j,0,ns+ncomp) = (16._rt/15._rt)*u(i,j+1,0,nu) - 0.5_rt*u(i,j,0,nu) - - (2._rt/3._rt)*u(i,j-1,0,nu) + 0.1_rt*u(i,j-2,0,nu); + slopes(i,j,0,ns+ncomp) = Real(16./15.)*u(i,j+1,0,nu) - Real(0.5)*u(i,j,0,nu) + - Real(2./3.)*u(i,j-1,0,nu) + Real(0.1)*u(i,j-2,0,nu); } } else { AMREX_PRAGMA_SIMD for (int i = lo.x; i <= hi.x; ++i) { - slopes(i,j,0,ns+ncomp) = -0.25_rt*(u(i,j-1,0,nu)+5._rt*u(i,j,0,nu)-6._rt*u(i,j+1,0,nu)); + slopes(i,j,0,ns+ncomp) = -Real(0.25)*(u(i,j-1,0,nu)+Real(5.)*u(i,j,0,nu)-Real(6.)*u(i,j+1,0,nu)); } } } @@ -154,8 +154,8 @@ cellconslin_slopes_linlim (Box const& bx, Array4 const& slopes, for (int j = lo.y; j <= hi.y; ++j) { AMREX_PRAGMA_SIMD for (int i = lo.x; i <= hi.x; ++i) { - sf(i,j,0,0) = 1.0_rt; - sf(i,j,0,1) = 1.0_rt; + sf(i,j,0,0) = Real(1.); + sf(i,j,0,1) = Real(1.); } } @@ -168,25 +168,25 @@ cellconslin_slopes_linlim (Box const& bx, Array4 const& slopes, AMREX_PRAGMA_SIMD for (int i = lo.x; i <= hi.x; ++i) { Real cen = slopes(i,j,0,n); - Real forw = 2.0_rt*(u(i+1,j,0,nu)-u(i ,j,0,nu)); - Real back = 2.0_rt*(u(i ,j,0,nu)-u(i-1,j,0,nu)); - Real slp = (forw*back >= 0.0_rt) ? amrex::min(amrex::Math::abs(forw),amrex::Math::abs(back)) : 0.0_rt; - slopes(i,j,0,n) = amrex::Math::copysign(1.0_rt,cen)*amrex::min(slp,amrex::Math::abs(cen)); - if (cen != 0.0_rt) { + Real forw = Real(2.)*(u(i+1,j,0,nu)-u(i ,j,0,nu)); + Real back = Real(2.)*(u(i ,j,0,nu)-u(i-1,j,0,nu)); + Real slp = (forw*back >= Real(0.)) ? 
amrex::min(amrex::Math::abs(forw),amrex::Math::abs(back)) : Real(0.); + slopes(i,j,0,n) = amrex::Math::copysign(Real(1.),cen)*amrex::min(slp,amrex::Math::abs(cen)); + if (cen != Real(0.)) { sf(i,j,0,0) = amrex::min(sf(i,j,0,0), slopes(i,j,0,n)/cen); } else { - sf(i,j,0,0) = 0.0_rt; + sf(i,j,0,0) = Real(0.); } cen = slopes(i,j,0,n+ncomp); - forw = 2.0_rt*(u(i,j+1,0,nu)-u(i,j ,0,nu)); - back = 2.0_rt*(u(i,j ,0,nu)-u(i,j-1,0,nu)); - slp = (forw*back >= 0.0_rt) ? amrex::min(amrex::Math::abs(forw),amrex::Math::abs(back)) : 0.0_rt; - slopes(i,j,0,n+ncomp) = amrex::Math::copysign(1.0_rt,cen)*amrex::min(slp,amrex::Math::abs(cen)); - if (cen != 0.0_rt) { + forw = Real(2.)*(u(i,j+1,0,nu)-u(i,j ,0,nu)); + back = Real(2.)*(u(i,j ,0,nu)-u(i,j-1,0,nu)); + slp = (forw*back >= Real(0.)) ? amrex::min(amrex::Math::abs(forw),amrex::Math::abs(back)) : Real(0.); + slopes(i,j,0,n+ncomp) = amrex::Math::copysign(Real(1.),cen)*amrex::min(slp,amrex::Math::abs(cen)); + if (cen != Real(0.)) { sf(i,j,0,1) = amrex::min(sf(i,j,0,1), slopes(i,j,0,n+ncomp)/cen); } else { - sf(i,j,0,1) = 0.0_rt; + sf(i,j,0,1) = Real(0.); } } } @@ -270,16 +270,16 @@ cellconslin_slopes_mclim (Box const& bx, Array4 const& slopes, AMREX_PRAGMA_SIMD for (int i = lo.x; i <= hi.x; ++i) { Real cen = slopes(i,j,0,n); - Real forw = 2.0_rt*(u(i+1,j,0,nu)-u(i ,j,0,nu)); - Real back = 2.0_rt*(u(i ,j,0,nu)-u(i-1,j,0,nu)); - Real slp = (forw*back >= 0.0_rt) ? amrex::min(amrex::Math::abs(forw),amrex::Math::abs(back)) : 0.0_rt; - slopes(i,j,0,n) = amrex::Math::copysign(1.0_rt,cen)*amrex::min(slp,amrex::Math::abs(cen)); + Real forw = Real(2.)*(u(i+1,j,0,nu)-u(i ,j,0,nu)); + Real back = Real(2.)*(u(i ,j,0,nu)-u(i-1,j,0,nu)); + Real slp = (forw*back >= Real(0.)) ? amrex::min(amrex::Math::abs(forw),amrex::Math::abs(back)) : Real(0.); + slopes(i,j,0,n) = amrex::Math::copysign(Real(1.),cen)*amrex::min(slp,amrex::Math::abs(cen)); cen = slopes(i,j,0,n+ncomp); - forw = 2.0_rt*(u(i,j+1,0,nu)-u(i,j ,0,nu)); - back = 2.0_rt*(u(i,j ,0,nu)-u(i,j-1,0,nu)); - slp = (forw*back >= 0.0_rt) ? amrex::min(amrex::Math::abs(forw),amrex::Math::abs(back)) : 0.0_rt; - slopes(i,j,0,n+ncomp) = amrex::Math::copysign(1.0_rt,cen)*amrex::min(slp,amrex::Math::abs(cen)); + forw = Real(2.)*(u(i,j+1,0,nu)-u(i,j ,0,nu)); + back = Real(2.)*(u(i,j ,0,nu)-u(i,j-1,0,nu)); + slp = (forw*back >= Real(0.)) ? 
amrex::min(amrex::Math::abs(forw),amrex::Math::abs(back)) : Real(0.); + slopes(i,j,0,n+ncomp) = amrex::Math::copysign(Real(1.),cen)*amrex::min(slp,amrex::Math::abs(cen)); } } } @@ -309,12 +309,12 @@ cellconslin_fine_alpha (Box const& bx, Array4 const& alpha, const Real dummy_fine = xoff[i-vlo.x]*slopes(ic,jc,0,n) + yoff[j-vlo.y]*slopes(ic,jc,0,n+ncomp); - if (dummy_fine > mm(ic,jc,0,n+ncomp) && dummy_fine != 0.0_rt) { + if (dummy_fine > mm(ic,jc,0,n+ncomp) && dummy_fine != Real(0.)) { alpha(i,j,0,n) = mm(ic,jc,0,n+ncomp) / dummy_fine; - } else if (dummy_fine < mm(ic,jc,0,n) && dummy_fine != 0.0_rt) { + } else if (dummy_fine < mm(ic,jc,0,n) && dummy_fine != Real(0.)) { alpha(i,j,0,n) = mm(ic,jc,0,n) / dummy_fine; } else { - alpha(i,j,0,n) = 1.0_rt; + alpha(i,j,0,n) = Real(1.); } } } @@ -334,7 +334,7 @@ cellconslin_slopes_mmlim (Box const& bx, Array4 const& slopes, const int jj = j*ratio[1]; for (int i = lo.x; i <= hi.x; ++i) { const int ii = i*ratio[0]; - Real a = 1.0_rt; + Real a = Real(1.); for (int joff = 0; joff < ratio[1]; ++joff) { for (int ioff = 0; ioff < ratio[0]; ++ioff) { a = amrex::min(a, alpha(ii+ioff,jj+joff,0,n)); @@ -382,8 +382,8 @@ nodebilin_slopes (Box const& bx, Array4 const& slope, Array4 const& const auto lo = amrex::lbound(bx); const auto hi = amrex::ubound(bx); - const Real rx = 1.0_rt/ratio[0]; - const Real ry = 1.0_rt/ratio[1]; + const Real rx = Real(1.)/ratio[0]; + const Real ry = Real(1.)/ratio[1]; for (int n = 0; n < ncomp; ++n) { for (int j = lo.y; j <= hi.y; ++j) { @@ -428,6 +428,28 @@ nodebilin_interp (Box const& bx, Array4 const& fine, const int fcomp, const i } } +template +AMREX_GPU_HOST_DEVICE AMREX_FORCE_INLINE void +face_linear_interp_x (int i, int j, int /*k*/, int n, Array4 const& fine, + Array4 const& crse, IntVect const& ratio) noexcept +{ + int ii = amrex::coarsen(i,ratio[0]); + int jj = amrex::coarsen(j,ratio[1]); + Real const w = static_cast(i-ii*ratio[0]) * (Real(1.)/ratio[0]); + fine(i,j,0,n) = (Real(1.)-w) * crse(ii,jj,0,n) + w * crse(ii+1,jj,0,n); +} + +template +AMREX_GPU_HOST_DEVICE AMREX_FORCE_INLINE void +face_linear_interp_y (int i, int j, int /*k*/, int n, Array4 const& fine, + Array4 const& crse, IntVect const& ratio) noexcept +{ + int ii = amrex::coarsen(i,ratio[0]); + int jj = amrex::coarsen(j,ratio[1]); + Real const w = static_cast(j-jj*ratio[1]) * (Real(1.)/ratio[1]); + fine(i,j,0,n) = (Real(1.)-w) * crse(ii,jj,0,n) + w * crse(ii,jj+1,0,n); +} + } #endif diff --git a/Src/AmrCore/AMReX_Interp_3D_C.H b/Src/AmrCore/AMReX_Interp_3D_C.H index c3450f2bd0d..091515b0a0e 100644 --- a/Src/AmrCore/AMReX_Interp_3D_C.H +++ b/Src/AmrCore/AMReX_Interp_3D_C.H @@ -11,8 +11,8 @@ namespace amrex { AMREX_GPU_HOST inline Vector -ccinterp_compute_voff (Box const& cbx, IntVect const& ratio, Geometry const& cgeom, - Geometry const& fgeom) noexcept +ccinterp_compute_voff (Box const& cbx, IntVect const& ratio, Geometry const& /*cgeom*/, + Geometry const& /*fgeom*/) noexcept { const Box& fbx = amrex::refine(cbx,ratio); const auto& flen = amrex::length(fbx); @@ -21,13 +21,13 @@ ccinterp_compute_voff (Box const& cbx, IntVect const& ratio, Geometry const& cge const int nxyz = flen.x + flen.y + flen.z; Vector voff(nxyz); - const Real xrinv = 1._rt/ratio[0]; - const Real yrinv = 1._rt/ratio[1]; - const Real zrinv = 1._rt/ratio[2]; + const Real xrinv = Real(1.)/ratio[0]; + const Real yrinv = Real(1.)/ratio[1]; + const Real zrinv = Real(1.)/ratio[2]; - const Real xtmp = 0.5_rt*(xrinv-1.0_rt); - const Real ytmp = 0.5_rt*(yrinv-1.0_rt); - const Real ztmp = 
0.5_rt*(zrinv-1.0_rt); + const Real xtmp = Real(0.5)*(xrinv-Real(1.)); + const Real ytmp = Real(0.5)*(yrinv-Real(1.)); + const Real ztmp = Real(0.5)*(zrinv-Real(1.)); Real* AMREX_RESTRICT xoff = &voff[0]; AMREX_PRAGMA_SIMD @@ -68,9 +68,9 @@ compute_slopes (const Dim3& lo, const Dim3& hi, for (int j = lo.y; j <= hi.y; ++j) { AMREX_PRAGMA_SIMD for (int i = lo.x; i <= hi.x; ++i) { - slopes(i,j,k,ns ) = 0.5_rt*(u(i+1,j,k,nu)-u(i-1,j,k,nu)); - slopes(i,j,k,ns+ncomp ) = 0.5_rt*(u(i,j+1,k,nu)-u(i,j-1,k,nu)); - slopes(i,j,k,ns+ncomp*2) = 0.5_rt*(u(i,j,k+1,nu)-u(i,j,k-1,nu)); + slopes(i,j,k,ns ) = Real(0.5)*(u(i+1,j,k,nu)-u(i-1,j,k,nu)); + slopes(i,j,k,ns+ncomp ) = Real(0.5)*(u(i,j+1,k,nu)-u(i,j-1,k,nu)); + slopes(i,j,k,ns+ncomp*2) = Real(0.5)*(u(i,j,k+1,nu)-u(i,j,k-1,nu)); } } } @@ -81,14 +81,14 @@ compute_slopes (const Dim3& lo, const Dim3& hi, if (shi.x-slo.x >= 1) { for (int k = lo.z; k <= hi.z; ++k) { for (int j = lo.y; j <= hi.y; ++j) { - slopes(i,j,k,ns) = -(16._rt/15._rt)*u(i-1,j,k,nu) + 0.5_rt*u(i,j,k,nu) - + (2._rt/3._rt)*u(i+1,j,k,nu) - 0.1_rt*u(i+2,j,k,nu); + slopes(i,j,k,ns) = -Real(16./15.)*u(i-1,j,k,nu) + Real(0.5)*u(i,j,k,nu) + + Real(2./3.)*u(i+1,j,k,nu) - Real(0.1)*u(i+2,j,k,nu); } } } else { for (int k = lo.z; k <= hi.z; ++k) { for (int j = lo.y; j <= hi.y; ++j) { - slopes(i,j,k,ns) = 0.25_rt*(u(i+1,j,k,nu)+5._rt*u(i,j,k,nu)-6._rt*u(i-1,j,k,nu)); + slopes(i,j,k,ns) = Real(0.25)*(u(i+1,j,k,nu)+Real(5.)*u(i,j,k,nu)-Real(6.)*u(i-1,j,k,nu)); } } } @@ -100,14 +100,14 @@ compute_slopes (const Dim3& lo, const Dim3& hi, if (shi.x-slo.x >= 1) { for (int k = lo.z; k <= hi.z; ++k) { for (int j = lo.y; j <= hi.y; ++j) { - slopes(i,j,k,ns) = (16._rt/15._rt)*u(i+1,j,k,nu) - 0.5_rt*u(i,j,k,nu) - - (2._rt/3._rt)*u(i-1,j,k,nu) + 0.1_rt*u(i-2,j,k,nu); + slopes(i,j,k,ns) = Real(16./15.)*u(i+1,j,k,nu) - Real(0.5)*u(i,j,k,nu) + - Real(2./3.)*u(i-1,j,k,nu) + Real(0.1)*u(i-2,j,k,nu); } } } else { for (int k = lo.z; k <= hi.z; ++k) { for (int j = lo.y; j <= hi.y; ++j) { - slopes(i,j,k,ns) = -0.25_rt*(u(i-1,j,k,nu)+5._rt*u(i,j,k,nu)-6._rt*u(i+1,j,k,nu)); + slopes(i,j,k,ns) = -Real(0.25)*(u(i-1,j,k,nu)+Real(5.)*u(i,j,k,nu)-Real(6.)*u(i+1,j,k,nu)); } } } @@ -120,15 +120,15 @@ compute_slopes (const Dim3& lo, const Dim3& hi, for (int k = lo.z; k <= hi.z; ++k) { AMREX_PRAGMA_SIMD for (int i = lo.x; i <= hi.x; ++i) { - slopes(i,j,k,ns+ncomp) = -(16._rt/15._rt)*u(i,j-1,k,nu) + 0.5_rt*u(i,j,k,nu) - + (2._rt/3._rt)*u(i,j+1,k,nu) - 0.1_rt*u(i,j+2,k,nu); + slopes(i,j,k,ns+ncomp) = -Real(16./15.)*u(i,j-1,k,nu) + Real(0.5)*u(i,j,k,nu) + + Real(2./3.)*u(i,j+1,k,nu) - Real(0.1)*u(i,j+2,k,nu); } } } else { for (int k = lo.z; k <= hi.z; ++k) { AMREX_PRAGMA_SIMD for (int i = lo.x; i <= hi.x; ++i) { - slopes(i,j,k,ns+ncomp) = 0.25_rt*(u(i,j+1,k,nu)+5._rt*u(i,j,k,nu)-6._rt*u(i,j-1,k,nu)); + slopes(i,j,k,ns+ncomp) = Real(0.25)*(u(i,j+1,k,nu)+Real(5.)*u(i,j,k,nu)-Real(6.)*u(i,j-1,k,nu)); } } } @@ -141,15 +141,15 @@ compute_slopes (const Dim3& lo, const Dim3& hi, for (int k = lo.z; k <= hi.z; ++k) { AMREX_PRAGMA_SIMD for (int i = lo.x; i <= hi.x; ++i) { - slopes(i,j,k,ns+ncomp) = (16._rt/15._rt)*u(i,j+1,k,nu) - 0.5_rt*u(i,j,k,nu) - - (2._rt/3._rt)*u(i,j-1,k,nu) + 0.1_rt*u(i,j-2,k,nu); + slopes(i,j,k,ns+ncomp) = Real(16./15.)*u(i,j+1,k,nu) - Real(0.5)*u(i,j,k,nu) + - Real(2./3.)*u(i,j-1,k,nu) + Real(0.1)*u(i,j-2,k,nu); } } } else { for (int k = lo.z; k <= hi.z; ++k) { AMREX_PRAGMA_SIMD for (int i = lo.x; i <= hi.x; ++i) { - slopes(i,j,k,ns+ncomp) = -0.25_rt*(u(i,j-1,k,nu)+5._rt*u(i,j,k,nu)-6._rt*u(i,j+1,k,nu)); + 
slopes(i,j,k,ns+ncomp) = -Real(0.25)*(u(i,j-1,k,nu)+Real(5.)*u(i,j,k,nu)-Real(6.)*u(i,j+1,k,nu)); } } } @@ -162,15 +162,15 @@ compute_slopes (const Dim3& lo, const Dim3& hi, for (int j = lo.y; j <= hi.y; ++j) { AMREX_PRAGMA_SIMD for (int i = lo.x; i <= hi.x; ++i) { - slopes(i,j,k,ns+2*ncomp) = -(16._rt/15._rt)*u(i,j,k-1,nu) + 0.5_rt*u(i,j,k,nu) - + (2._rt/3._rt)*u(i,j,k+1,nu) - 0.1_rt*u(i,j,k+2,nu); + slopes(i,j,k,ns+2*ncomp) = -Real(16./15.)*u(i,j,k-1,nu) + Real(0.5)*u(i,j,k,nu) + + Real(2./3.)*u(i,j,k+1,nu) - Real(0.1)*u(i,j,k+2,nu); } } } else { for (int j = lo.y; j <= hi.y; ++j) { AMREX_PRAGMA_SIMD for (int i = lo.x; i <= hi.x; ++i) { - slopes(i,j,k,ns+2*ncomp) = 0.25_rt*(u(i,j,k+1,nu)+5._rt*u(i,j,k,nu)-6._rt*u(i,j,k-1,nu)); + slopes(i,j,k,ns+2*ncomp) = Real(0.25)*(u(i,j,k+1,nu)+Real(5.)*u(i,j,k,nu)-Real(6.)*u(i,j,k-1,nu)); } } } @@ -183,15 +183,15 @@ compute_slopes (const Dim3& lo, const Dim3& hi, for (int j = lo.y; j <= hi.y; ++j) { AMREX_PRAGMA_SIMD for (int i = lo.x; i <= hi.x; ++i) { - slopes(i,j,k,ns+2*ncomp) = (16._rt/15._rt)*u(i,j,k+1,nu) - 0.5_rt*u(i,j,k,nu) - - (2._rt/3._rt)*u(i,j,k-1,nu) + 0.1_rt*u(i,j,k-2,nu); + slopes(i,j,k,ns+2*ncomp) = Real(16./15.)*u(i,j,k+1,nu) - Real(0.5)*u(i,j,k,nu) + - Real(2./3.)*u(i,j,k-1,nu) + Real(0.1)*u(i,j,k-2,nu); } } } else { for (int j = lo.y; j <= hi.y; ++j) { AMREX_PRAGMA_SIMD for (int i = lo.x; i <= hi.x; ++i) { - slopes(i,j,k,ns+2*ncomp) = -0.25_rt*(u(i,j,k-1,nu)+5._rt*u(i,j,k,nu)-6._rt*u(i,j,k+1,nu)); + slopes(i,j,k,ns+2*ncomp) = -Real(0.25)*(u(i,j,k-1,nu)+Real(5.)*u(i,j,k,nu)-Real(6.)*u(i,j,k+1,nu)); } } } @@ -217,9 +217,9 @@ cellconslin_slopes_linlim (Box const& bx, Array4 const& slopes, for (int j = lo.y; j <= hi.y; ++j) { AMREX_PRAGMA_SIMD for (int i = lo.x; i <= hi.x; ++i) { - sf(i,j,k,0) = 1.0_rt; - sf(i,j,k,1) = 1.0_rt; - sf(i,j,k,2) = 1.0_rt; + sf(i,j,k,0) = Real(1.); + sf(i,j,k,1) = Real(1.); + sf(i,j,k,2) = Real(1.); } } } @@ -234,36 +234,36 @@ cellconslin_slopes_linlim (Box const& bx, Array4 const& slopes, AMREX_PRAGMA_SIMD for (int i = lo.x; i <= hi.x; ++i) { Real cen = slopes(i,j,k,n); - Real forw = 2.0_rt*(u(i+1,j,k,nu)-u(i ,j,k,nu)); - Real back = 2.0_rt*(u(i ,j,k,nu)-u(i-1,j,k,nu)); - Real slp = (forw*back >= 0.0_rt) ? amrex::min(amrex::Math::abs(forw),amrex::Math::abs(back)) : 0.0_rt; - slopes(i,j,k,n) = amrex::Math::copysign(1.0_rt,cen)*amrex::min(slp,amrex::Math::abs(cen)); - if (cen != 0.0_rt) { + Real forw = Real(2.)*(u(i+1,j,k,nu)-u(i ,j,k,nu)); + Real back = Real(2.)*(u(i ,j,k,nu)-u(i-1,j,k,nu)); + Real slp = (forw*back >= Real(0.)) ? amrex::min(amrex::Math::abs(forw),amrex::Math::abs(back)) : Real(0.); + slopes(i,j,k,n) = amrex::Math::copysign(Real(1.),cen)*amrex::min(slp,amrex::Math::abs(cen)); + if (cen != Real(0.)) { sf(i,j,k,0) = amrex::min(sf(i,j,k,0), slopes(i,j,k,n)/cen); } else { - sf(i,j,k,0) = 0.0_rt; + sf(i,j,k,0) = Real(0.); } cen = slopes(i,j,k,n+ncomp); - forw = 2.0_rt*(u(i,j+1,k,nu)-u(i,j ,k,nu)); - back = 2.0_rt*(u(i,j ,k,nu)-u(i,j-1,k,nu)); - slp = (forw*back >= 0.0_rt) ? amrex::min(amrex::Math::abs(forw),amrex::Math::abs(back)) : 0.0_rt; - slopes(i,j,k,n+ncomp) = amrex::Math::copysign(1.0_rt,cen)*amrex::min(slp,amrex::Math::abs(cen)); - if (cen != 0.0_rt) { + forw = Real(2.)*(u(i,j+1,k,nu)-u(i,j ,k,nu)); + back = Real(2.)*(u(i,j ,k,nu)-u(i,j-1,k,nu)); + slp = (forw*back >= Real(0.)) ? 
amrex::min(amrex::Math::abs(forw),amrex::Math::abs(back)) : Real(0.); + slopes(i,j,k,n+ncomp) = amrex::Math::copysign(Real(1.),cen)*amrex::min(slp,amrex::Math::abs(cen)); + if (cen != Real(0.)) { sf(i,j,k,1) = amrex::min(sf(i,j,k,1), slopes(i,j,k,n+ncomp)/cen); } else { - sf(i,j,k,1) = 0.0_rt; + sf(i,j,k,1) = Real(0.); } cen = slopes(i,j,k,n+ncomp*2); - forw = 2.0_rt*(u(i,j,k+1,nu)-u(i,j,k ,nu)); - back = 2.0_rt*(u(i,j,k ,nu)-u(i,j,k-1,nu)); - slp = (forw*back >= 0.0_rt) ? amrex::min(amrex::Math::abs(forw),amrex::Math::abs(back)) : 0.0_rt; - slopes(i,j,k,n+ncomp*2) = amrex::Math::copysign(1.0_rt,cen)*amrex::min(slp,amrex::Math::abs(cen)); - if (cen != 0.0_rt) { + forw = Real(2.)*(u(i,j,k+1,nu)-u(i,j,k ,nu)); + back = Real(2.)*(u(i,j,k ,nu)-u(i,j,k-1,nu)); + slp = (forw*back >= Real(0.)) ? amrex::min(amrex::Math::abs(forw),amrex::Math::abs(back)) : Real(0.); + slopes(i,j,k,n+ncomp*2) = amrex::Math::copysign(Real(1.),cen)*amrex::min(slp,amrex::Math::abs(cen)); + if (cen != Real(0.)) { sf(i,j,k,2) = amrex::min(sf(i,j,k,2), slopes(i,j,k,n+ncomp*2)/cen); } else { - sf(i,j,k,2) = 0.0_rt; + sf(i,j,k,2) = Real(0.); } } } @@ -361,22 +361,22 @@ cellconslin_slopes_mclim (Box const& bx, Array4 const& slopes, AMREX_PRAGMA_SIMD for (int i = lo.x; i <= hi.x; ++i) { Real cen = slopes(i,j,k,n); - Real forw = 2.0_rt*(u(i+1,j,k,nu)-u(i ,j,k,nu)); - Real back = 2.0_rt*(u(i ,j,k,nu)-u(i-1,j,k,nu)); - Real slp = (forw*back >= 0.0_rt) ? amrex::min(amrex::Math::abs(forw),amrex::Math::abs(back)) : 0.0_rt; - slopes(i,j,k,n) = amrex::Math::copysign(1.0_rt,cen)*amrex::min(slp,amrex::Math::abs(cen)); + Real forw = Real(2.)*(u(i+1,j,k,nu)-u(i ,j,k,nu)); + Real back = Real(2.)*(u(i ,j,k,nu)-u(i-1,j,k,nu)); + Real slp = (forw*back >= Real(0.)) ? amrex::min(amrex::Math::abs(forw),amrex::Math::abs(back)) : Real(0.); + slopes(i,j,k,n) = amrex::Math::copysign(Real(1.),cen)*amrex::min(slp,amrex::Math::abs(cen)); cen = slopes(i,j,k,n+ncomp); - forw = 2.0_rt*(u(i,j+1,k,nu)-u(i,j ,k,nu)); - back = 2.0_rt*(u(i,j ,k,nu)-u(i,j-1,k,nu)); - slp = (forw*back >= 0.0_rt) ? amrex::min(amrex::Math::abs(forw),amrex::Math::abs(back)) : 0.0_rt; - slopes(i,j,k,n+ncomp) = amrex::Math::copysign(1.0_rt,cen)*amrex::min(slp,amrex::Math::abs(cen)); + forw = Real(2.)*(u(i,j+1,k,nu)-u(i,j ,k,nu)); + back = Real(2.)*(u(i,j ,k,nu)-u(i,j-1,k,nu)); + slp = (forw*back >= Real(0.)) ? amrex::min(amrex::Math::abs(forw),amrex::Math::abs(back)) : Real(0.); + slopes(i,j,k,n+ncomp) = amrex::Math::copysign(Real(1.),cen)*amrex::min(slp,amrex::Math::abs(cen)); cen = slopes(i,j,k,n+ncomp*2); - forw = 2.0_rt*(u(i,j,k+1,nu)-u(i,j,k ,nu)); - back = 2.0_rt*(u(i,j,k ,nu)-u(i,j,k-1,nu)); - slp = (forw*back >= 0.0_rt) ? amrex::min(amrex::Math::abs(forw),amrex::Math::abs(back)) : 0.0_rt; - slopes(i,j,k,n+ncomp*2) = amrex::Math::copysign(1.0_rt,cen)*amrex::min(slp,amrex::Math::abs(cen)); + forw = Real(2.)*(u(i,j,k+1,nu)-u(i,j,k ,nu)); + back = Real(2.)*(u(i,j,k ,nu)-u(i,j,k-1,nu)); + slp = (forw*back >= Real(0.)) ? 
amrex::min(amrex::Math::abs(forw),amrex::Math::abs(back)) : Real(0.); + slopes(i,j,k,n+ncomp*2) = amrex::Math::copysign(Real(1.),cen)*amrex::min(slp,amrex::Math::abs(cen)); } } } @@ -411,12 +411,12 @@ cellconslin_fine_alpha (Box const& bx, Array4 const& alpha, + yoff[j-vlo.y]*slopes(ic,jc,kc,n+ncomp) + zoff[k-vlo.z]*slopes(ic,jc,kc,n+ncomp*2); - if (dummy_fine > mm(ic,jc,kc,n+ncomp) && dummy_fine != 0.0_rt) { + if (dummy_fine > mm(ic,jc,kc,n+ncomp) && dummy_fine != Real(0.)) { alpha(i,j,k,n) = mm(ic,jc,kc,n+ncomp) / dummy_fine; - } else if (dummy_fine < mm(ic,jc,kc,n) && dummy_fine != 0.0_rt) { + } else if (dummy_fine < mm(ic,jc,kc,n) && dummy_fine != Real(0.)) { alpha(i,j,k,n) = mm(ic,jc,kc,n) / dummy_fine; } else { - alpha(i,j,k,n) = 1.0_rt; + alpha(i,j,k,n) = Real(1.); } } } @@ -439,7 +439,7 @@ cellconslin_slopes_mmlim (Box const& bx, Array4 const& slopes, const int jj = j*ratio[1]; for (int i = lo.x; i <= hi.x; ++i) { const int ii = i*ratio[0]; - Real a = 1.0_rt; + Real a = Real(1.); for (int koff = 0; koff < ratio[2]; ++koff) { for (int joff = 0; joff < ratio[1]; ++joff) { for (int ioff = 0; ioff < ratio[0]; ++ioff) { @@ -498,9 +498,9 @@ nodebilin_slopes (Box const& bx, Array4 const& slope, Array4 const& const auto lo = amrex::lbound(bx); const auto hi = amrex::ubound(bx); - const Real rx = 1.0_rt/ratio[0]; - const Real ry = 1.0_rt/ratio[1]; - const Real rz = 1.0_rt/ratio[2]; + const Real rx = Real(1.)/ratio[0]; + const Real ry = Real(1.)/ratio[1]; + const Real rz = Real(1.)/ratio[2]; for (int n = 0; n < ncomp; ++n) { const int nu = n + icomp; @@ -566,6 +566,42 @@ nodebilin_interp (Box const& bx, Array4 const& fine, const int fcomp, const i } } +template +AMREX_GPU_HOST_DEVICE AMREX_FORCE_INLINE void +face_linear_interp_x (int i, int j, int k, int n, Array4 const& fine, + Array4 const& crse, IntVect const& ratio) noexcept +{ + int ii = amrex::coarsen(i,ratio[0]); + int jj = amrex::coarsen(j,ratio[1]); + int kk = amrex::coarsen(k,ratio[2]); + Real const w = static_cast(i-ii*ratio[0]) * (Real(1.)/ratio[0]); + fine(i,j,k,n) = (Real(1.)-w) * crse(ii,jj,kk,n) + w * crse(ii+1,jj,kk,n); +} + +template +AMREX_GPU_HOST_DEVICE AMREX_FORCE_INLINE void +face_linear_interp_y (int i, int j, int k, int n, Array4 const& fine, + Array4 const& crse, IntVect const& ratio) noexcept +{ + int ii = amrex::coarsen(i,ratio[0]); + int jj = amrex::coarsen(j,ratio[1]); + int kk = amrex::coarsen(k,ratio[2]); + Real const w = static_cast(j-jj*ratio[1]) * (Real(1.)/ratio[1]); + fine(i,j,k,n) = (Real(1.)-w) * crse(ii,jj,kk,n) + w * crse(ii,jj+1,kk,n); +} + +template +AMREX_GPU_HOST_DEVICE AMREX_FORCE_INLINE void +face_linear_interp_z (int i, int j, int k, int n, Array4 const& fine, + Array4 const& crse, IntVect const& ratio) noexcept +{ + int ii = amrex::coarsen(i,ratio[0]); + int jj = amrex::coarsen(j,ratio[1]); + int kk = amrex::coarsen(k,ratio[2]); + Real const w = static_cast(k-kk*ratio[2]) * (Real(1.)/ratio[2]); + fine(i,j,k,n) = (Real(1.)-w) * crse(ii,jj,kk,n) + w * crse(ii,jj,kk+1,n); +} + } #endif diff --git a/Src/AmrCore/AMReX_Interpolater.H b/Src/AmrCore/AMReX_Interpolater.H index 3896df24d5e..24cfeb0d6bd 100644 --- a/Src/AmrCore/AMReX_Interpolater.H +++ b/Src/AmrCore/AMReX_Interpolater.H @@ -98,19 +98,19 @@ public: * \param fine_geom * \param bcr */ - virtual void protect (const FArrayBox& crse, - int crse_comp, - FArrayBox& fine, - int fine_comp, - FArrayBox& fine_state, - int state_comp, - int ncomp, - const Box& fine_region, - const IntVect& ratio, - const Geometry& crse_geom, - const Geometry& 
fine_geom, - Vector& bcr, - RunOn gpu_or_cpu) {}; + virtual void protect (const FArrayBox& /*crse*/, + int /*crse_comp*/, + FArrayBox& /*fine*/, + int /*fine_comp*/, + FArrayBox& /*fine_state*/, + int /*state_comp*/, + int /*ncomp*/, + const Box& /*fine_region*/, + const IntVect& /*ratio*/, + const Geometry& /*crse_geom*/, + const Geometry& /*fine_geom*/, + Vector& /*bcr*/, + RunOn /*gpu_or_cpu*/) {} virtual InterpolaterBoxCoarsener BoxCoarsener (const IntVect& ratio); @@ -646,10 +646,76 @@ public: }; #endif +/** +* \brief Linear interpolation on face data. +* +* The interpolation is linear in the face-normal direction and piecewise constant +* in the transverse directions (see face_linear_interp_x/y/z). +*/ + +class FaceLinear + : + public Interpolater +{ +public: + + /** + * \brief The destructor. + */ + virtual ~FaceLinear () override; + + /** + * \brief Returns coarsened box given fine box and refinement ratio. + * + * \param fine + * \param ratio + */ + virtual Box CoarseBox (const Box& fine, + int ratio) override; + + /** + * \brief Returns coarsened box given fine box and refinement ratio. + * + * \param fine + * \param ratio + */ + virtual Box CoarseBox (const Box& fine, + const IntVect& ratio) override; + + /** + * \brief Coarse to fine interpolation in space. + * + * \param crse + * \param crse_comp + * \param fine + * \param fine_comp + * \param ncomp + * \param fine_region + * \param ratio + * \param crse_geom + * \param fine_geom + * \param bcr + * \param actual_comp + * \param actual_state + */ + virtual void interp (const FArrayBox& crse, + int crse_comp, + FArrayBox& fine, + int fine_comp, + int ncomp, + const Box& fine_region, + const IntVect& ratio, + const Geometry& crse_geom, + const Geometry& fine_geom, + Vector const& bcr, + int actual_comp, + int actual_state, + RunOn gpu_or_cpu) override; +}; //! CONSTRUCT A GLOBAL OBJECT OF EACH VERSION. extern PCInterp pc_interp; extern NodeBilinear node_bilinear_interp; +extern FaceLinear face_linear_interp; extern CellConservativeLinear lincc_interp; extern CellConservativeLinear cell_cons_interp; diff --git a/Src/AmrCore/AMReX_Interpolater.cpp b/Src/AmrCore/AMReX_Interpolater.cpp index 4da717bdc0a..570fdf0e9c6 100644 --- a/Src/AmrCore/AMReX_Interpolater.cpp +++ b/Src/AmrCore/AMReX_Interpolater.cpp @@ -13,7 +13,8 @@ namespace amrex { // -// PCInterp, NodeBilinear, and CellConservativeLinear are supported for all dimensions on cpu and gpu. +// PCInterp, NodeBilinear, FaceLinear, and CellConservativeLinear are supported for all dimensions +// on cpu and gpu. // // CellConservativeProtected only works in 2D and 3D on cpu. // @@ -29,6 +30,7 @@ namespace amrex { // PCInterp pc_interp; NodeBilinear node_bilinear_interp; +FaceLinear face_linear_interp; CellConservativeLinear lincc_interp; CellConservativeLinear cell_cons_interp(0); @@ -141,6 +143,76 @@ NodeBilinear::interp (const FArrayBox& crse, }); } +Box +FaceLinear::CoarseBox (const Box& fine, int ratio) +{ + return CoarseBox(fine, IntVect(ratio)); +} + +Box +FaceLinear::CoarseBox (const Box& fine, const IntVect& ratio) +{ + Box b = amrex::coarsen(fine,ratio); + for (int i = 0; i < AMREX_SPACEDIM; i++) { + if (b.type(i) == IndexType::NODE && b.length(i) < 2) { + // Don't want degenerate boxes in nodal direction.
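+ // (For example, with ratio 2 a fine x-face box with nodes {0,1} coarsens to the single node {0}; growing the high side restores a second node, so the interpolation can read both crse(ii,...) and crse(ii+1,...).)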
+ b.growHi(i,1); + } + } + return b; +} + +void +FaceLinear::interp (const FArrayBox& crse, + int crse_comp, + FArrayBox& fine, + int fine_comp, + int ncomp, + const Box& fine_region, + const IntVect& ratio, + const Geometry& /*crse_geom */, + const Geometry& /*fine_geom */, + Vector const& /*bcr*/, + int /*actual_comp*/, + int /*actual_state*/, + RunOn runon) +{ + BL_PROFILE("FaceLinear::interp()"); + + AMREX_ASSERT(AMREX_D_TERM(fine_region.type(0),+fine_region.type(1),+fine_region.type(2)) == 1); + + Array4 const& fine_arr = fine.array(fine_comp); + Array4 const& crse_arr = crse.const_array(crse_comp); + + if (fine_region.type(0) == IndexType::NODE) + { + AMREX_HOST_DEVICE_PARALLEL_FOR_4D_FLAG(runon,fine_region,ncomp,i,j,k,n, + { + face_linear_interp_x(i,j,k,n,fine_arr,crse_arr,ratio); + }); + } +#if (AMREX_SPACEDIM >= 2) + else if (fine_region.type(1) == IndexType::NODE) + { + AMREX_HOST_DEVICE_PARALLEL_FOR_4D_FLAG(runon,fine_region,ncomp,i,j,k,n, + { + face_linear_interp_y(i,j,k,n,fine_arr,crse_arr,ratio); + }); + } +#if (AMREX_SPACEDIM == 3) + else + { + AMREX_HOST_DEVICE_PARALLEL_FOR_4D_FLAG(runon,fine_region,ncomp,i,j,k,n, + { + face_linear_interp_z(i,j,k,n,fine_arr,crse_arr,ratio); + }); + } +#endif +#endif +} + +FaceLinear::~FaceLinear () {} + #ifndef BL_NO_FORT CellBilinear::~CellBilinear () {} @@ -187,7 +259,7 @@ CellBilinear::interp (const FArrayBox& crse, Vector const& /*bcr*/, int actual_comp, int actual_state, - RunOn runon) + RunOn /*runon*/) { BL_PROFILE("CellBilinear::interp()"); // @@ -399,8 +471,13 @@ CellQuadratic::interp (const FArrayBox& crse, Vector const& bcr, int actual_comp, int actual_state, - RunOn runon) + RunOn /*runon*/) { +#if (AMREX_SPACEDIM == 1) + amrex::ignore_unused(crse,crse_comp,fine,fine_comp,ncomp,fine_region, + ratio,crse_geom,fine_geom,bcr,actual_comp,actual_state); + amrex::Abort("1D CellQuadratic::interp not supported"); +#else BL_PROFILE("CellQuadratic::interp()"); BL_ASSERT(bcr.size() >= ncomp); // @@ -471,8 +548,6 @@ CellQuadratic::interp (const FArrayBox& crse, Vector bc = GetBCArray(bcr); const int* ratioV = ratio.getVect(); -#if (AMREX_SPACEDIM > 1) - amrex_cqinterp (fdat,AMREX_ARLIM(flo),AMREX_ARLIM(fhi), AMREX_ARLIM(fblo), AMREX_ARLIM(fbhi), &ncomp,AMREX_D_DECL(&ratioV[0],&ratioV[1],&ratioV[2]), @@ -566,8 +641,8 @@ CellConservativeProtected::interp (const FArrayBox& crse, const Geometry& crse_geom, const Geometry& fine_geom, Vector const& bcr, - int actual_comp, - int actual_state, + int /*actual_comp*/, + int /*actual_state*/, RunOn runon) { BL_PROFILE("CellConservativeProtected::interp()"); @@ -630,8 +705,14 @@ CellConservativeProtected::protect (const FArrayBox& crse, const Geometry& crse_geom, const Geometry& fine_geom, Vector& bcr, - RunOn runon) + RunOn /*runon*/) { +#if (AMREX_SPACEDIM == 1) + amrex::ignore_unused(crse,crse_comp,fine,fine_comp,fine_state, + state_comp,ncomp,fine_region,ratio, + crse_geom,fine_geom,bcr); + amrex::Abort("1D CellConservativeProtected::protect not supported"); +#else BL_PROFILE("CellConservativeProtected::protect()"); BL_ASSERT(bcr.size() >= ncomp); @@ -695,8 +776,6 @@ CellConservativeProtected::protect (const FArrayBox& crse, Vector bc = GetBCArray(bcr); const int* ratioV = ratio.getVect(); -#if (AMREX_SPACEDIM > 1) - amrex_protect_interp (fdat,AMREX_ARLIM(flo),AMREX_ARLIM(fhi), fblo, fbhi, cdat,AMREX_ARLIM(clo),AMREX_ARLIM(chi), @@ -711,7 +790,7 @@ CellConservativeProtected::protect (const FArrayBox& crse, &ncomp,AMREX_D_DECL(&ratioV[0],&ratioV[1],&ratioV[2]), bc.dataPtr()); -#endif 
/*(AMREX_SPACEDIM > 1)*/ +#endif /*(AMREX_SPACEDIM == 1)*/ } #endif @@ -750,7 +829,7 @@ CellConservativeQuartic::interp (const FArrayBox& crse, Vector const& bcr, int actual_comp, int actual_state, - RunOn runon) + RunOn /*runon*/) { BL_PROFILE("CellConservativeQuartic::interp()"); BL_ASSERT(bcr.size() >= ncomp); diff --git a/Src/AmrCore/AMReX_TagBox.H b/Src/AmrCore/AMReX_TagBox.H index c92bd18fe43..433da05b983 100644 --- a/Src/AmrCore/AMReX_TagBox.H +++ b/Src/AmrCore/AMReX_TagBox.H @@ -57,56 +57,24 @@ public: /** * \brief Construct and return a new tagbox in which the coarsened cell * is tagged if any of the corresponding fine cells are tagged. - * - * \param ratio - * \param owner */ - void coarsen (const IntVect& ratio) noexcept; + void coarsen (const IntVect& ratio, const Box& cbox) noexcept; /** * \brief Mark neighbors of every tagged cell a distance nbuff away - * only search interior for initial tagged points where nwid - * is given as the width of the bndry region. * * \param nbuff - * \param nwid - */ - void buffer (const IntVect& nbuf, const IntVect& nwid) noexcept; - - /** - * \brief Tag cells on intersect with src if corresponding src cell is tagged. - * - * \param src - */ - void merge (const TagBox& src) noexcept; - - /** - * \brief Add location of every tagged cell to IntVect array, - * starting at given location. Returns the number of - * collated points. - * - * \param ar - * \param start */ - Long collate (Vector& ar, int start) const noexcept; - - /** - * \brief Returns number of tagged cells in specified Box. - * - * \param bx - */ - Long numTags (const Box& bx) const noexcept; - - /** - * \brief Returns total number of tagged cells in the TagBox. - */ - Long numTags () const noexcept; + void buffer (const IntVect& nbuf) noexcept; /** * \brief Returns Vector\ of size domain.numPts() suitable for calling * Fortran, with positions set to same value as in the TagBox * dataPtr().
*/ +//#if (__cplusplus >= 201402L) +// [[deprecated("No need to use this unless calling Fortran < 2003")]] +//#endif Vector tags () const noexcept; /** @@ -117,6 +85,9 @@ public: * \param ar * \param tilebx */ +//#if (__cplusplus >= 201402L) +// [[deprecated("No need to use this unless calling Fortran < 2003")]] +//#endif void get_itags(Vector& ar, const Box& tilebx) const noexcept; /** @@ -125,6 +96,9 @@ public: * * \param ar */ +//#if (__cplusplus >= 201402L) +// [[deprecated("No need to use this unless calling Fortran < 2003")]] +//#endif void tags (const Vector& ar) noexcept; /** @@ -133,6 +107,9 @@ public: * * \param ar */ +//#if (__cplusplus >= 201402L) +// [[deprecated("No need to use this unless calling Fortran < 2003")]] +//#endif void tags_and_untags (const Vector& ar) noexcept; /** @@ -142,6 +119,9 @@ public: * \param ar * \param tilebx */ +//#if (__cplusplus >= 201402L) +// [[deprecated("No need to use this unless calling Fortran < 2003")]] +//#endif void tags (const Vector& ar, const Box& tilebx) noexcept; /** @@ -151,6 +131,9 @@ public: * \param ar * \param tilebx */ +//#if (__cplusplus >= 201402L) +// [[deprecated("No need to use this unless calling Fortran < 2003")]] +//#endif void tags_and_untags (const Vector& ar, const Box& tilebx) noexcept; }; @@ -183,16 +166,10 @@ public: ~TagBoxArray () override = default; TagBoxArray (TagBoxArray&& rhs) noexcept = default; + TagBoxArray& operator= (TagBoxArray&& rhs) noexcept = default; TagBoxArray (const TagBoxArray& rhs) = delete; TagBoxArray& operator= (const TagBoxArray& rhs) = delete; - TagBoxArray& operator= (TagBoxArray&& rhs) = delete; - - - /** - * \brief Returns the grow factor for the TagBoxArray. - */ - IntVect borderSize () const noexcept; /** * \brief Calls buffer() on all contained TagBoxes. @@ -202,12 +179,12 @@ public: void buffer (const IntVect& nbuf); /** - * \brief Map tagged cells through a periodic boundary to other grids in - * TagBoxArray cells which were outside domain are set to TagBox::CLEAR. + * \brief This function does two things: it maps tagged cells through periodic boundaries to + * other grids in the TagBoxArray, and it removes duplicate tags. * * \param geom */ - void mapPeriodic (const Geometry& geom); + void mapPeriodicRemoveDuplicates (const Geometry& geom); /** * \brief Set values in bl to val. @@ -241,17 +218,20 @@ public: */ void coarsen (const IntVect& ratio); - /** - * \brief The total number of Tags in all the contained TagBoxes. - */ - Long numTags () const; - /** * \brief Calls collate() on all contained TagBoxes. * * \param TheGlobalCollateSpace */ void collate (Vector& TheGlobalCollateSpace) const; + + // \brief Are there tags in the region defined by bx?
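+ // This query is collective over MPI: the result is Or-reduced across ranks (see ParallelAllReduce::Or in the implementation), so every rank gets the same answer.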
+ bool hasTags (Box const& bx) const; + + void local_collate_cpu (Vector& v) const; +#ifdef AMREX_USE_GPU + void local_collate_gpu (Vector& v) const; +#endif }; } diff --git a/Src/AmrCore/AMReX_TagBox.cpp b/Src/AmrCore/AMReX_TagBox.cpp index 7136d1b849b..48b71791108 100644 --- a/Src/AmrCore/AMReX_TagBox.cpp +++ b/Src/AmrCore/AMReX_TagBox.cpp @@ -8,6 +8,8 @@ #include #include #include +#include +#include namespace amrex { @@ -19,257 +21,87 @@ TagBox::TagBox (Arena* ar) noexcept TagBox::TagBox (const Box& bx, int n, Arena* ar) : BaseFab(bx,n,ar) -{ - setVal(TagBox::CLEAR); -} +{} TagBox::TagBox (const Box& bx, int n, bool alloc, bool shared, Arena* ar) : BaseFab(bx,n,alloc,shared,ar) -{ - if (alloc) setVal(TagBox::CLEAR); -} +{} TagBox::TagBox (const TagBox& rhs, MakeType make_type, int scomp, int ncomp) : BaseFab(rhs,make_type,scomp,ncomp) {} void -TagBox::coarsen (const IntVect& ratio) noexcept +TagBox::coarsen (const IntVect& ratio, const Box& cbox) noexcept { BL_ASSERT(nComp() == 1); + Array4 const& farr = this->const_array(); - TagType* fdat = dataPtr(); - IntVect lov = domain.smallEnd(); - IntVect hiv = domain.bigEnd(); - IntVect d_length = domain.size(); - const int* flo = lov.getVect(); - const int* fhi = hiv.getVect(); - const int* flen = d_length.getVect(); + TagBox cfab(cbox, 1, The_Arena()); + Elixir eli = cfab.elixir(); + Array4 const& carr = cfab.array(); - const Box& cbox = amrex::coarsen(domain,ratio); + Box fdomain = domain; + Dim3 r{1,1,1}; + AMREX_D_TERM(r.x = ratio[0];, r.y = ratio[1];, r.z = ratio[2]); - this->nvar = 1; - this->domain = cbox; - - const int* clo = cbox.loVect(); - IntVect cbox_len = cbox.size(); - const int* clen = cbox_len.getVect(); - - Box b1(amrex::refine(cbox,ratio)); - const int* lo = b1.loVect(); - int longlen = b1.longside(); - - Long numpts = domain.numPts(); - Vector cfab(numpts); - TagType* cdat = cfab.dataPtr(); - - Vector t(longlen,TagBox::CLEAR); - - int klo = 0, khi = 0, jlo = 0, jhi = 0, ilo, ihi; - AMREX_D_TERM(ilo=flo[0]; ihi=fhi[0]; , - jlo=flo[1]; jhi=fhi[1]; , - klo=flo[2]; khi=fhi[2];) - -#define IXPROJ(i,r) (((i)+(r)*std::abs(i))/(r) - std::abs(i)) -#define IOFF(j,k,lo,len) AMREX_D_TERM(0, +(j-lo[1])*len[0], +(k-lo[2])*len[0]*len[1]) - - int ratiox = 1, ratioy = 1, ratioz = 1; - AMREX_D_TERM(ratiox = ratio[0];, - ratioy = ratio[1];, - ratioz = ratio[2];) - - for (int k = klo; k <= khi; k++) - { - const int kc = IXPROJ(k,ratioz); - amrex::ignore_unused(kc); - for (int j = jlo; j <= jhi; j++) - { - const int jc = IXPROJ(j,ratioy); - TagType* c = cdat + IOFF(jc,kc,clo,clen); - const TagType* f = fdat + IOFF(j,k,flo,flen); - // - // Copy fine grid row of values into tmp array. - // - for (int i = ilo; i <= ihi; i++) - t[i-lo[0]] = f[i-ilo]; - - for (int off = 0; off < ratiox; off++) - { - for (int ic = 0; ic < clen[0]; ic++) - { - const int i = ic*ratiox + off; - c[ic] = std::max(c[ic],t[i]); - } - } - } - } - -#undef IXPROJ -#undef IOFF - - for (int i = 0; i < numpts; ++i) { - fdat[i] = cdat[i]; - } -} - -void -TagBox::buffer (const IntVect& nbuff, const IntVect& nwid) noexcept -{ - // - // Note: this routine assumes cell with TagBox::SET tag are in - // interior of tagbox (region = grow(domain,-nwid)). 
- // - Box inside(domain); - inside.grow(-nwid); - const int* inlo = inside.loVect(); - const int* inhi = inside.hiVect(); - - int klo = 0, khi = 0, jlo = 0, jhi = 0, ilo, ihi; - AMREX_D_TERM(ilo=inlo[0]; ihi=inhi[0]; , - jlo=inlo[1]; jhi=inhi[1]; , - klo=inlo[2]; khi=inhi[2];) - - int ni = 0, nj = 0, nk = 0; - AMREX_D_TERM(ni=nbuff[0];, nj=nbuff[1];, nk=nbuff[2];) - - IntVect d_length = domain.size(); - const int* len = d_length.getVect(); - const int* lo = domain.loVect(); - TagType* d = dataPtr(); - -#define OFF(i,j,k,lo,len) AMREX_D_TERM(i-lo[0], +(j-lo[1])*len[0] , +(k-lo[2])*len[0]*len[1]) - - for (int k = klo; k <= khi; k++) + AMREX_HOST_DEVICE_FOR_3D(cbox, i, j, k, { - for (int j = jlo; j <= jhi; j++) - { - for (int i = ilo; i <= ihi; i++) - { - TagType* d_check = d + OFF(i,j,k,lo,len); - if (*d_check == TagBox::SET) - { - for (int kk = -nk; kk <= nk; kk++) - { - for (int jj = -nj; jj <= nj; jj++) - { - for (int ii = -ni; ii <= ni; ii++) - { - TagType* dn = d_check+ AMREX_D_TERM(ii, +jj*len[0], +kk*len[0]*len[1]); - if (*dn !=TagBox::SET) - *dn = TagBox::BUF; - } - } + TagType t = TagBox::CLEAR; + for (int koff = 0; koff < r.z; ++koff) { + int kk = k*r.z + koff; + for (int joff = 0; joff < r.y; ++joff) { + int jj = j*r.y + joff; + for (int ioff = 0; ioff < r.x; ++ioff) { + int ii = i*r.x + ioff; + if (fdomain.contains(IntVect(AMREX_D_DECL(ii,jj,kk)))) { + t = t || farr(ii,jj,kk); } } } } - } -#undef OFF -} + carr(i,j,k) = t; + }); -void -TagBox::merge (const TagBox& src) noexcept -{ - // - // Compute intersections. - // - const Box& bx = domain & src.domain; - - if (bx.ok()) - { - const int* dlo = domain.loVect(); - IntVect d_length = domain.size(); - const int* dleng = d_length.getVect(); - const int* slo = src.domain.loVect(); - IntVect src_length = src.domain.size(); - const int* sleng = src_length.getVect(); - const int* lo = bx.loVect(); - const int* hi = bx.hiVect(); - const TagType* ds0 = src.dataPtr(); - TagType* dd0 = dataPtr(); - - int klo = 0, khi = 0, jlo = 0, jhi = 0, ilo, ihi; - AMREX_D_TERM(ilo=lo[0]; ihi=hi[0]; , - jlo=lo[1]; jhi=hi[1]; , - klo=lo[2]; khi=hi[2];) - -#define OFF(i,j,k,lo,len) AMREX_D_TERM(i-lo[0], +(j-lo[1])*len[0] , +(k-lo[2])*len[0]*len[1]) - - for (int k = klo; k <= khi; k++) - { - for (int j = jlo; j <= jhi; j++) - { - for (int i = ilo; i <= ihi; i++) - { - const TagType* ds = ds0 + OFF(i,j,k,slo,sleng); - if (*ds != TagBox::CLEAR) - { - TagType* dd = dd0 + OFF(i,j,k,dlo,dleng); - *dd = TagBox::SET; - } - } - } - } - } -#undef OFF -} - -Long -TagBox::numTags () const noexcept -{ - Long nt = 0L; - Long len = domain.numPts(); - const TagType* d = dataPtr(); - for (Long n = 0; n < len; ++n) +#ifdef AMREX_USE_GPU + if (Gpu::inLaunchRegion()) { + Gpu::dtod_memcpy_async(this->dataPtr(), cfab.dataPtr(), sizeof(TagType)*cbox.numPts()); + } else +#endif { - if (d[n] != TagBox::CLEAR) - ++nt; + std::memcpy(this->dataPtr(), cfab.dataPtr(), sizeof(TagType)*cbox.numPts()); } - return nt; -} - -Long -TagBox::numTags (const Box& b) const noexcept -{ - TagBox tempTagBox(b,1); - tempTagBox.copy(*this); - return tempTagBox.numTags(); + this->domain = cbox; } -Long -TagBox::collate (Vector& ar, int start) const noexcept +void +TagBox::buffer (const IntVect& a_nbuff) noexcept { - BL_ASSERT(start >= 0); - // - // Starting at given offset of array ar, enter location (IntVect) of - // each tagged cell in tagbox. 
- // - Long count = 0; - IntVect d_length = domain.size(); - const int* len = d_length.getVect(); - const int* lo = domain.loVect(); - const TagType* d = dataPtr(); - int ni = 1, nj = 1, nk = 1; - AMREX_D_TERM(ni = len[0]; , nj = len[1]; , nk = len[2];) - - for (int k = 0; k < nk; k++) + Array4 const& a = this->array(); + Dim3 nbuf = a_nbuff.dim3(); + const auto lo = amrex::lbound(domain); + const auto hi = amrex::ubound(domain); + AMREX_HOST_DEVICE_FOR_3D(domain, i, j, k, { - for (int j = 0; j < nj; j++) - { - for (int i = 0; i < ni; i++) - { - const TagType* dn = d + AMREX_D_TERM(i, +j*len[0], +k*len[0]*len[1]); - if (*dn != TagBox::CLEAR) - { - ar[start++] = IntVect(AMREX_D_DECL(lo[0]+i,lo[1]+j,lo[2]+k)); - count++; - } - } + if (a(i,j,k) == TagBox::CLEAR) { + bool to_buf = false; + int imin = amrex::max(i-nbuf.x, lo.x); + int jmin = amrex::max(j-nbuf.y, lo.y); + int kmin = amrex::max(k-nbuf.z, lo.z); + int imax = amrex::min(i+nbuf.x, hi.x); + int jmax = amrex::min(j+nbuf.y, hi.y); + int kmax = amrex::min(k+nbuf.z, hi.z); + for (int kk = kmin; kk <= kmax && !to_buf; ++kk) { + for (int jj = jmin; jj <= jmax && !to_buf; ++jj) { + for (int ii = imin; ii <= imax && !to_buf; ++ii) { + if (a(ii,jj,kk) == TagBox::SET) to_buf = true; + }}} + if (to_buf) a(i,j,k) = TagBox::BUF; } - } - return count; + }); } +// DEPRECATED Vector TagBox::tags () const noexcept { @@ -287,7 +119,7 @@ TagBox::tags () const noexcept return ar; } - +// DEPRECATED // Set values as specified by the array -- this only tags. // It's an error if ar.length() != domain.numPts(). void @@ -305,6 +137,7 @@ TagBox::tags (const Vector& ar) noexcept } } +// DEPRECATED // Set values as specified by the array -- this tags and untags. // It's an error if ar.length() != domain.numPts(). void @@ -322,6 +155,7 @@ TagBox::tags_and_untags (const Vector& ar) noexcept } } +// DEPRECATED // Since a TagBox is a BaseFab, we can use this utility // function to allocate an integer array to have the same number // of elements as cells in tilebx @@ -364,6 +198,7 @@ TagBox::get_itags(Vector& ar, const Box& tilebx) const noexcept } } +// DEPRECATED // Set values as specified by the array -- this only tags. // only changes values in the tilebx region void @@ -397,6 +232,7 @@ TagBox::tags (const Vector& ar, const Box& tilebx) noexcept } } +// DEPRECATED // Set values as specified by the array -- this tags and untags. 
// only changes values in the tilebx region void @@ -436,7 +272,7 @@ TagBoxArray::TagBoxArray (const BoxArray& ba, : FabArray(ba,dm,1,_ngrow,MFInfo(),DefaultFabFactory()) { - if (SharedMemory()) setVal(TagBox::CLEAR); + setVal(TagBox::CLEAR); } TagBoxArray::TagBoxArray (const BoxArray& ba, @@ -445,145 +281,351 @@ : FabArray(ba,dm,1,_ngrow,MFInfo(),DefaultFabFactory()) { - if (SharedMemory()) setVal(TagBox::CLEAR); -} - -IntVect -TagBoxArray::borderSize () const noexcept -{ - return n_grow; + setVal(TagBox::CLEAR); } void TagBoxArray::buffer (const IntVect& nbuf) { - Gpu::LaunchSafeGuard lsg(false); // xxxxx TODO: gpu - AMREX_ASSERT(nbuf.allLE(n_grow)); if (nbuf.max() > 0) { #ifdef _OPENMP -#pragma omp parallel +#pragma omp parallel if (Gpu::notInLaunchRegion()) #endif - for (MFIter mfi(*this); mfi.isValid(); ++mfi) - get(mfi).buffer(nbuf, n_grow); + for (MFIter mfi(*this); mfi.isValid(); ++mfi) { + get(mfi).buffer(nbuf); + } } } void -TagBoxArray::mapPeriodic (const Geometry& geom) +TagBoxArray::mapPeriodicRemoveDuplicates (const Geometry& geom) { - if (!geom.isAnyPeriodic()) return; - - BL_PROFILE("TagBoxArray::mapPeriodic()"); + BL_PROFILE("TagBoxArray::mapPRD"); - // This function is called after coarsening. - // So we can assume that n_grow is 0. - BL_ASSERT(n_grow[0] == 0); + if (Gpu::inLaunchRegion()) + { + // There is no atomicAdd for char, so we have to use int. + iMultiFab itag = amrex::cast(*this); + iMultiFab tmp(boxArray(),DistributionMap(),1,nGrowVect()); + tmp.setVal(0); + tmp.ParallelAdd(itag, 0, 0, 1, nGrowVect(), nGrowVect(), geom.periodicity()); + + // We need to keep tags in periodic boundary + const auto owner_mask = amrex::OwnerMask(tmp, Periodicity::NonPeriodic(), nGrowVect()); +#ifdef _OPENMP +#pragma omp parallel +#endif + for (MFIter mfi(tmp); mfi.isValid(); ++mfi) { + Box const& box = mfi.fabbox(); + Array4 const& tag = this->array(mfi); + Array4 const& tmptag = tmp.const_array(mfi); + Array4 const& msk = owner_mask->const_array(mfi); + amrex::ParallelFor(box, + [=] AMREX_GPU_DEVICE (int i, int j, int k) noexcept + { + if (msk(i,j,k)) { + tag(i,j,k) = static_cast(tmptag(i,j,k)); + } else { + tag(i,j,k) = TagBox::CLEAR; + } + }); + } + } + else + { + TagBoxArray tmp(boxArray(),DistributionMap(),nGrowVect()); // note that tmp is filled w/ CLEAR.
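+ // ParallelAdd accumulates tags from every overlapping grid, including copies shifted through periodic boundaries; the OwnerMask pass below then keeps one owner per cell and clears the rest, which removes the duplicates.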
+ // We need to keep tags in periodic boundary + const auto owner_mask = amrex::OwnerMask(tmp, Periodicity::NonPeriodic(), nGrowVect()); +#ifdef _OPENMP +#pragma omp parallel +#endif + for (MFIter mfi(tmp); mfi.isValid(); ++mfi) { + Box const& box = mfi.fabbox(); + Array4 const& tag = tmp.array(mfi); + Array4 const& msk = owner_mask->const_array(mfi); + AMREX_LOOP_3D(box, i, j, k, + { + if (!msk(i,j,k)) tag(i,j,k) = TagBox::CLEAR; + }); + } - tmp.copy(*this, geom.periodicity(), FabArrayBase::ADD); + std::swap(*this, tmp); + } +} - Gpu::LaunchSafeGuard lsg(false); // xxxxx TODO: gpu +void +TagBoxArray::local_collate_cpu (Vector& v) const +{ + if (this->local_size() == 0) return; + Vector count(this->local_size()); #ifdef _OPENMP #pragma omp parallel #endif - for (MFIter mfi(*this); mfi.isValid(); ++mfi) + for (MFIter fai(*this); fai.isValid(); ++fai) { - get(mfi).merge(tmp[mfi]); + Array4 const& arr = this->const_array(fai); + Box const& bx = fai.fabbox(); + int c = 0; + AMREX_LOOP_3D(bx,i,j,k, + { + if (arr(i,j,k) != TagBox::CLEAR) ++c; + }); + count[fai.LocalIndex()] = c; } -} -Long -TagBoxArray::numTags () const -{ - Long ntag = 0; + Vector offset(count.size()+1); + offset[0] = 0; + std::partial_sum(count.begin(), count.end(), offset.begin()+1); - Gpu::LaunchSafeGuard lsg(false); // xxxxx TODO: gpu + v.resize(offset.back()); + + if (v.empty()) return; #ifdef _OPENMP -#pragma omp parallel reduction(+:ntag) +#pragma omp parallel #endif - for (MFIter mfi(*this); mfi.isValid(); ++mfi) + for (MFIter fai(*this); fai.isValid(); ++fai) { - ntag += get(mfi).numTags(); + int li = fai.LocalIndex(); + if (count[li] > 0) { + IntVect* p = v.data() + offset[li]; + Array4 const& arr = this->const_array(fai); + Box const& bx = fai.fabbox(); + AMREX_LOOP_3D(bx,i,j,k, + { + if (arr(i,j,k) != TagBox::CLEAR) { + *p++ = IntVect(AMREX_D_DECL(i,j,k)); + } + }); + } } - - ParallelDescriptor::ReduceLongSum(ntag); - - return ntag; } +#ifdef AMREX_USE_GPU void -TagBoxArray::collate (Vector& TheGlobalCollateSpace) const +TagBoxArray::local_collate_gpu (Vector& v) const { - BL_PROFILE("TagBoxArray::collate()"); + const int nfabs = this->local_size(); + if (nfabs == 0) return; - // Gpu::LaunchSafeGuard lsg(false); // xxxxx TODO: gpu + constexpr int block_size = 128; + Vector nblocks(nfabs); + for (MFIter fai(*this); fai.isValid(); ++fai) + { + Box const& bx = fai.fabbox(); + nblocks[fai.LocalIndex()] = (bx.numPts() + block_size-1) / block_size; + } + Vector blockoffset(nblocks.size()+1); + blockoffset[0] = 0; + std::partial_sum(nblocks.begin(), nblocks.end(), blockoffset.begin()+1); + int ntotblocks = blockoffset.back(); - Long count = 0; + PODVector > dv_ntags(ntotblocks); -#ifdef _OPENMP -#pragma omp parallel reduction(+:count) -#endif for (MFIter fai(*this); fai.isValid(); ++fai) { - count += get(fai).numTags(); + const int li = fai.LocalIndex(); + int* ntags = dv_ntags.data() + blockoffset[li]; + const int ncells = fai.fabbox().numPts(); + const char* tags = (*this)[fai].dataPtr(); +#ifdef AMREX_USE_DPCPP + amrex::launch(nblocks[li], block_size, sizeof(int)*Gpu::Device::warp_size, + Gpu::Device::gpuStream(), + [=] AMREX_GPU_DEVICE (Gpu::Handler const& h) noexcept + { + int bid = h.item.get_group_linear_id(); + int tid = h.item.get_local_id(0); + int icell = h.item.get_global_id(0); + + int t = 0; + if (icell < ncells && tags[icell] != TagBox::CLEAR) { + t = 1; + } + + t = Gpu::blockReduce + (t, Gpu::warpReduce >(), 0, h); + if (tid == 0) { + ntags[bid] = t; + } + }); +#else + amrex::launch(nblocks[li], block_size, 
Gpu::Device::gpuStream(), + [=] AMREX_GPU_DEVICE () noexcept + { + int bid = blockIdx.x; + int tid = threadIdx.x; + int icell = blockDim.x*blockIdx.x+threadIdx.x; + + int t = 0; + if (icell < ncells && tags[icell] != TagBox::CLEAR) { + t = 1; + } + + t = Gpu::blockReduce + (t, Gpu::warpReduce >(), 0); + if (tid == 0) { + ntags[bid] = t; + } + }); +#endif } - // - // Local space for holding just those tags we want to gather to the root cpu. - // - Vector TheLocalCollateSpace(count); + PODVector > hv_ntags(ntotblocks); + Gpu::dtoh_memcpy(hv_ntags.data(), dv_ntags.data(), ntotblocks*sizeof(int)); - count = 0; + PODVector > hv_tags_offset(ntotblocks+1); + hv_tags_offset[0] = 0; + std::partial_sum(hv_ntags.begin(), hv_ntags.end(), hv_tags_offset.begin()+1); + int ntotaltags = hv_tags_offset.back(); - // unsafe to do OMP + if (ntotaltags == 0) return; + + PODVector > dv_tags_offset(ntotblocks); + int* dp_tags_offset = dv_tags_offset.data(); + Gpu::htod_memcpy(dp_tags_offset, hv_tags_offset.data(), ntotblocks*sizeof(int)); +#ifdef AMREX_USE_DPCPP + Gpu::synchronize(); +#endif + + PODVector > dv_tags(ntotaltags); + IntVect* dp_tags = dv_tags.data(); + + int iblock = 0; for (MFIter fai(*this); fai.isValid(); ++fai) { - count += get(fai).collate(TheLocalCollateSpace,count); + const int li = fai.LocalIndex(); + int iblock_begin = iblock; + int iblock_end = iblock + nblocks[li]; + iblock = iblock_end; + int count = 0; + for (int ib = iblock_begin; ib < iblock_end; ++ib) { + count += hv_ntags[ib]; + } + if (count > 0) { + Box const& bx = fai.fabbox(); + const auto lo = amrex::lbound(bx); + const auto len = amrex::length(bx); + const int ncells = bx.numPts(); + const char* tags = (*this)[fai].dataPtr(); +#ifdef AMREX_USE_DPCPP + amrex::launch(nblocks[li], block_size, sizeof(unsigned int), Gpu::Device::gpuStream(), + [=] AMREX_GPU_DEVICE (Gpu::Handler const& h) noexcept + { + int bid = h.item.get_group(0); + int tid = h.item.get_local_id(0); + int icell = h.item.get_global_id(0); + + unsigned int* shared_counter = (unsigned int*)h.local; + if (tid == 0) { + *shared_counter = 0; + } + h.item.barrier(sycl::access::fence_space::local_space); + + if (icell < ncells && tags[icell] != TagBox::CLEAR) { + unsigned int itag = Gpu::Atomic::Inc + (shared_counter, 20480u); + IntVect* p = dp_tags + dp_tags_offset[iblock_begin+bid]; + int k = icell / (len.x*len.y); + int j = (icell - k*(len.x*len.y)) / len.x; + int i = (icell - k*(len.x*len.y)) - j*len.x; + i += lo.x; + j += lo.y; + k += lo.z; + p[itag] = IntVect(AMREX_D_DECL(i,j,k)); + } + }); +#else + amrex::launch(nblocks[li], block_size, sizeof(unsigned int), Gpu::Device::gpuStream(), + [=] AMREX_GPU_DEVICE () noexcept + { + int bid = blockIdx.x; + int tid = threadIdx.x; + int icell = blockDim.x*blockIdx.x+threadIdx.x; + + Gpu::SharedMemory gsm; + unsigned int * shared_counter = gsm.dataPtr(); + if (tid == 0) { + *shared_counter = 0; + } + __syncthreads(); + + if (icell < ncells && tags[icell] != TagBox::CLEAR) { + unsigned int itag = Gpu::Atomic::Inc(shared_counter, blockDim.x); + IntVect* p = dp_tags + dp_tags_offset[iblock_begin+bid]; + int k = icell / (len.x*len.y); + int j = (icell - k*(len.x*len.y)) / len.x; + int i = (icell - k*(len.x*len.y)) - j*len.x; + i += lo.x; + j += lo.y; + k += lo.z; + p[itag] = IntVect(AMREX_D_DECL(i,j,k)); + } + }); +#endif + } } - if (count > 0) + v.resize(ntotaltags); + Gpu::dtoh_memcpy(v.data(), dp_tags, ntotaltags*sizeof(IntVect)); +} +#endif + +void +TagBoxArray::collate (Vector& TheGlobalCollateSpace) const +{ + 
BL_PROFILE("TagBoxArray::collate()"); + + Vector TheLocalCollateSpace; +#ifdef AMREX_USE_GPU + if (Gpu::inLaunchRegion()) { + local_collate_gpu(TheLocalCollateSpace); + } else +#endif { - amrex::RemoveDuplicates(TheLocalCollateSpace); - count = TheLocalCollateSpace.size(); + local_collate_cpu(TheLocalCollateSpace); } + + Long count = TheLocalCollateSpace.size(); + // // The total number of tags system wide that must be collated. - // This is really just an estimate of the upper bound due to duplicates. - // While we've removed duplicates per MPI process there's still more systemwide. // Long numtags = count; - ParallelDescriptor::ReduceLongSum(numtags); if (numtags == 0) { TheGlobalCollateSpace.clear(); return; + } else if (numtags > static_cast(std::numeric_limits::max())) { + // xxxxx todo + amrex::Abort("TagBoxArray::collate: Too many tags. Using a larger blocking factor might help. Please file an issue on github"); } +#ifdef BL_USE_MPI // - // This holds all tags after they've been gather'd and unique'ified. + // On I/O proc. this holds all tags after they've been gather'd. + // On other procs. non-mempty signals size is not zero. // - // Each CPU needs an identical copy since they all must go through grid_places() which isn't parallelized. - - TheGlobalCollateSpace.resize(numtags); + if (ParallelDescriptor::IOProcessor()) { + TheGlobalCollateSpace.resize(numtags); + } else { + TheGlobalCollateSpace.resize(1); + } -#ifdef BL_USE_MPI // // Tell root CPU how many tags each CPU will be sending. // const int IOProcNumber = ParallelDescriptor::IOProcessorNumber(); - count *= AMREX_SPACEDIM; // Convert from count of tags to count of integers to expect. - const std::vector& countvec = ParallelDescriptor::Gather(count, IOProcNumber); - - std::vector offset(countvec.size(),0L); - if (ParallelDescriptor::IOProcessor()) - { + const std::vector& countvec = ParallelDescriptor::Gather(static_cast(count), + IOProcNumber); + std::vector offset(countvec.size(),0); + if (ParallelDescriptor::IOProcessor()) { for (int i = 1, N = offset.size(); i < N; i++) { offset[i] = offset[i-1] + countvec[i-1]; } @@ -591,93 +633,136 @@ TagBoxArray::collate (Vector& TheGlobalCollateSpace) const // // Gather all the tags to IOProcNumber into TheGlobalCollateSpace. // - BL_ASSERT(sizeof(IntVect) == AMREX_SPACEDIM * sizeof(int)); - const int* psend = (count > 0) ? TheLocalCollateSpace[0].getVect() : 0; - int* precv = TheGlobalCollateSpace[0].getVect(); - ParallelDescriptor::Gatherv(psend, count, - precv, countvec, offset, IOProcNumber); - - if (ParallelDescriptor::IOProcessor()) - { - amrex::RemoveDuplicates(TheGlobalCollateSpace); - numtags = TheGlobalCollateSpace.size(); - } - - // - // Now broadcast them back to the other processors. - // - ParallelDescriptor::Bcast(&numtags, 1, IOProcNumber); - ParallelDescriptor::Bcast(TheGlobalCollateSpace[0].getVect(), numtags*AMREX_SPACEDIM, IOProcNumber); - TheGlobalCollateSpace.resize(numtags); + const IntVect* psend = (count > 0) ? TheLocalCollateSpace.data() : nullptr; + IntVect* precv = TheGlobalCollateSpace.data(); + ParallelDescriptor::Gatherv(psend, count, precv, countvec, offset, IOProcNumber); #else - // - // Copy TheLocalCollateSpace to TheGlobalCollateSpace. 
 
 void
-TagBoxArray::setVal (const BoxList& bl,
-                     TagBox::TagVal  val)
+TagBoxArray::setVal (const BoxList& bl, TagBox::TagVal val)
 {
     BoxArray ba(bl);
     setVal(ba,val);
 }
 
 void
-TagBoxArray::setVal (const BoxDomain& bd,
-                     TagBox::TagVal   val)
+TagBoxArray::setVal (const BoxDomain& bd, TagBox::TagVal val)
 {
     setVal(bd.boxList(),val);
 }
 
 void
-TagBoxArray::setVal (const BoxArray& ba,
-                     TagBox::TagVal  val)
+TagBoxArray::setVal (const BoxArray& ba, TagBox::TagVal val)
 {
-    Gpu::LaunchSafeGuard lsg(false); // xxxxx TODO: gpu
-
+    Vector<Array4BoxTag<char> > tags;
+    bool run_on_gpu = Gpu::inLaunchRegion();
#ifdef _OPENMP
-#pragma omp parallel
+#pragma omp parallel if (!run_on_gpu)
 #endif
-    for (MFIter mfi(*this); mfi.isValid(); ++mfi)
     {
         std::vector< std::pair<int,Box> > isects;
-
-        ba.intersections(mfi.fabbox(),isects);
-
-        TagBox& tags = get(mfi);
-
-        for (int i = 0, N = isects.size(); i < N; i++)
+        for (MFIter mfi(*this); mfi.isValid(); ++mfi)
         {
-            tags.setVal(val,isects[i].second,0);
+            TagBox& fab = (*this)[mfi];
+            Array4<char> const& arr = this->array(mfi);
+            ba.intersections(mfi.fabbox(), isects);
+            for (const auto& is : isects) {
+                Box const& b = is.second;
+                if (run_on_gpu) {
+                    tags.push_back({arr,b});
+                } else {
+                    fab.setVal(val,b);
+                }
+            }
         }
     }
+
+#ifdef AMREX_USE_GPU
+    amrex::ParallelFor(tags, 1,
+    [=] AMREX_GPU_DEVICE (int i, int j, int k, int /*n*/, Array4<char> const& a) noexcept
+    {
+        a(i,j,k) = val;
+    });
+#endif
 }
 
 void
 TagBoxArray::coarsen (const IntVect & ratio)
 {
-    // If team is used, all team workers need to go through all the fabs, including ones they don't own.
+    // If team is used, all team workers need to go through all the fabs,
+    // including ones they don't own.
     int teamsize = ParallelDescriptor::TeamSize();
     unsigned char flags = (teamsize == 1) ? 0 : MFIter::AllBoxes;
 
-    Gpu::LaunchSafeGuard lsg(false); // xxxxx TODO: gpu
+    IntVect new_n_grow;
+    for (int idim = 0; idim < AMREX_SPACEDIM; ++idim) {
+        new_n_grow[idim] = (n_grow[idim]+ratio[idim]-1)/ratio[idim];
+    }
 
 #if defined(_OPENMP)
-#pragma omp parallel if (teamsize == 1)
+#pragma omp parallel if (teamsize == 1 && Gpu::notInLaunchRegion())
 #endif
     for (MFIter mfi(*this,flags); mfi.isValid(); ++mfi)
     {
-        this->fabPtr(mfi)->coarsen(ratio);
+        Box const& cbox = amrex::grow(amrex::coarsen(mfi.validbox(),ratio),new_n_grow);
+        this->fabPtr(mfi)->coarsen(ratio,cbox);
     }
 
-    boxarray.growcoarsen(n_grow,ratio);
-    updateBDKey();  // because we just modify boxarray in-place.
+    boxarray.coarsen(ratio);
+    n_grow = new_n_grow;
+}
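
// Illustrative aside (not part of the patch): the new_n_grow computation in
// coarsen() is an integer ceiling division -- n fine ghost cells must still
// be covered after coarsening by `ratio`, which takes ceil(n/ratio) coarse
// cells.  A self-contained sketch (coarsen_grow is a hypothetical name):

constexpr int coarsen_grow (int n_grow, int ratio)
{
    return (n_grow + ratio - 1) / ratio;   // ceil(n_grow/ratio) in integer arithmetic
}

static_assert(coarsen_grow(4, 2) == 2, "exact division");
static_assert(coarsen_grow(4, 3) == 2, "4 fine ghost cells need 2 coarse cells");
static_assert(coarsen_grow(1, 4) == 1, "a nonzero ghost region never coarsens away");
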
+
+bool
+TagBoxArray::hasTags (Box const& a_bx) const
+{
+    bool has_tags = false;
+#ifdef AMREX_USE_GPU
+    if (Gpu::inLaunchRegion()) {
+        ReduceOps<ReduceOpLogicalOr> reduce_op;
+        ReduceData<int> reduce_data(reduce_op);
+        using ReduceTuple = typename decltype(reduce_data)::Type;
+
+        for (MFIter mfi(*this); mfi.isValid(); ++mfi)
+        {
+            Box const& b = a_bx & mfi.fabbox();
+            if (b.ok()) {
+                const auto& arr = this->const_array(mfi);
+                reduce_op.eval(b, reduce_data,
+                [=] AMREX_GPU_DEVICE (int i, int j, int k) -> ReduceTuple
+                {
+                    int tr = arr(i,j,k) != TagBox::CLEAR;
+                    return {tr};
+                });
+            }
+        }
+
+        ReduceTuple hv = reduce_data.value();
+        has_tags = static_cast<bool>(amrex::get<0>(hv));
+    } else
+#endif
+    {
+#ifdef _OPENMP
+#pragma omp parallel reduction(||:has_tags)
+#endif
+        for (MFIter mfi(*this); mfi.isValid(); ++mfi)
+        {
+            Box const& b = a_bx & mfi.fabbox();
+            if (b.ok()) {
+                Array4<char const> const& arr = this->const_array(mfi);
+                AMREX_LOOP_3D(b, i, j, k,
+                {
+                    has_tags = has_tags || (arr(i,j,k) != TagBox::CLEAR);
+                });
+            }
+        }
+    }
 
-    n_grow = IntVect::TheZeroVector();
+    ParallelAllReduce::Or(has_tags, ParallelContext::CommunicatorSub());
+    return has_tags;
 }
 
 }
diff --git a/Src/AmrCore/CMakeLists.txt b/Src/AmrCore/CMakeLists.txt
index 833213eb129..cd7ba6c0589 100644
--- a/Src/AmrCore/CMakeLists.txt
+++ b/Src/AmrCore/CMakeLists.txt
@@ -19,25 +19,25 @@ target_sources(amrex
       AMReX_Interpolater.H
       AMReX_TagBox.H
       AMReX_AmrMesh.H
-      AMReX_FluxReg_${DIM}D_C.H
+      AMReX_FluxReg_${AMReX_SPACEDIM}D_C.H
       AMReX_FluxReg_C.H
       AMReX_Interp_C.H
-      AMReX_Interp_${DIM}D_C.H
+      AMReX_Interp_${AMReX_SPACEDIM}D_C.H
    )
 
-if (ENABLE_FORTRAN)
+if (AMReX_FORTRAN)
    target_sources(amrex
       PRIVATE
       AMReX_FillPatchUtil_F.H
-      AMReX_FillPatchUtil_${DIM}d.F90
+      AMReX_FillPatchUtil_${AMReX_SPACEDIM}d.F90
       AMReX_FLUXREG_F.H
       AMReX_FLUXREG_nd.F90
       AMReX_INTERP_F.H
-      AMReX_INTERP_${DIM}D.F90
+      AMReX_INTERP_${AMReX_SPACEDIM}D.F90
       )
 endif ()
 
 # These files are needed only if Particles are enabled
-if ( ENABLE_PARTICLES )
+if ( AMReX_PARTICLES )
    target_sources( amrex PRIVATE AMReX_AmrParGDB.H AMReX_AmrParticles.H )
 endif ()
diff --git a/Src/AmrTask/AMFIter/AMReX_AmrTask.H b/Src/AmrTask/AMFIter/AMReX_AmrTask.H
deleted file mode 100644
index 8a7ab9b8344..00000000000
--- a/Src/AmrTask/AMFIter/AMReX_AmrTask.H
+++ /dev/null
@@ -1,923 +0,0 @@
-#ifndef AMREX_AmrTask_H_
-#define AMREX_AmrTask_H_
-
-#include
-#include
-#include
-
-#include "AMReX_AbstractTask.H"
-#include "AMReX_TaskGraph.H"
-#include "RTS.H"
-#include
-#include
-#include
-#include
-#include
-#include
-#include
-#include
-#include
-#include
-
-#include
-#include
-bool verbose=false;
-
-namespace amrex {
-    // These are all ParmParse'd in.  Set defaults in Initialize()!!!
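
// Illustrative aside (not part of the patch): the "ParmParse'd in" note
// above refers to AMReX's runtime-parameter system.  The usual pattern,
// sketched here with one of the variables below and an assumed default:

#include <AMReX_ParmParse.H>

int plot_nfiles = 64;   // assumed default; real defaults are set in Initialize()

void read_params ()
{
    amrex::ParmParse pp("amr");
    pp.query("plot_nfiles", plot_nfiles); // overridden by "amr.plot_nfiles" in an inputs file, if present
}
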
- extern int plot_nfiles; - extern int mffile_nstreams; - extern int probinit_natonce; - extern bool plot_files_output; - extern int checkpoint_nfiles; - extern int regrid_on_restart; - extern int use_efficient_regrid; - extern int plotfile_on_restart; - extern int checkpoint_on_restart; - extern bool checkpoint_files_output; - extern int compute_new_dt_on_regrid; - extern bool precreateDirectories; - extern bool prereadFAHeaders; - - enum task_states{ - _coarseTimeStep=0, - _post_coarseTimeStep, - _timeStep, - _timeStep_advance, - _post_timeStep, - _final, - }; - - /**** State transition diagrams of tasks on the coarse level (lower part) and fine level (upper part) - * - * _timeStep -> _timeStep_advance -> _post_timestep - * ^\ ^\ | | \\ - * \ \_____________| | \\ - * // \ | \\ (signal) - * // \____________(subcycling)___________________| \\ - * // \\ - * // (fine task) - * ------------------------------------------------------------------------------------------------------------------------------------------- - * // (signal) - * _coarseTimeStep -> _timeStep -------> _timeStep_advance -------------> _post_timestep --------------> _post_coarseTimeStep (coarsest task) - * |^\ ^\ | | - * | \ \_______________| | - * | \ | - * | \ | - * | \ | - * _final \_____________________________________________________________________________________________________________________________________________| - */ - - class AmrTask: public Task - { - LocalConnection l_con; - RemoteConnection r_con; - struct TileArray - { - Vector numLocalTiles; - Vector localTileIndexMap; - Vector tileArray; - } ta; - bool _do_tiling; - int current_tile; - Amr* _amr; - int max_step; - Real stop_time; - - public: - AmrTask(){} - Amr* originalAmr(){return _amr;} - AmrLevel& originalAmrLevel(int lev){return _amr->getLevel(lev);} - - - size_t tagGen(int src, int dest, int amrlevels, int fabs) - { - return (src*fabs + dest%fabs)*amrlevels; - } - - void multifabCopyPush(amrex::MultiFab* mfDst, amrex::MultiFab* mfSrc, int dstcomp, int srccomp, int nc, int ng, int ngsrc, amrex::FabArrayBase::CPC *cpc) - { - } - - - void FillBoundaryPush(){ - for(int i=0; iSetTag(i); //this is local copy so the recipient will have the matching tag - msg->SetDestRank(ParallelDescriptor::MyProc()); - _fab->copyToMem(l_con.scpy[i].sbx, 0, _mf->nComp(), msg->GetBuffer()); //pack box to the message - _outputs.push(msg);//let the runtime know that the output is available - } - int np = ParallelDescriptor::NProcs(); - if (np==1) return; - for(int i=0; iSetTag(tagGen(r_con.snd[i].ns, r_con.snd[i].nd, 1, _mf->size())); - msg->SetDestRank(r_con.snd[i].pr); - _fab->copyToMem(r_con.snd[i].sbx, 0, _mf->nComp(), msg->GetBuffer()); - _outputs.push(msg); - } - } - - void FillPatchSingleLevelPush (MultiFab& mf, MultiFab *dmf, Real time, - const Vector& smf, const Vector& stime, - int scomp, int dcomp, int ncomp, - const Geometry& geom, PhysBCFunctBase& physbcf) - { - BL_ASSERT(scomp+ncomp <= smf[0]->nComp()); - BL_ASSERT(dcomp+ncomp <= mf.nComp()); - BL_ASSERT(smf.size() == stime.size()); - BL_ASSERT(smf.size() != 0); - - if (smf.size() == 1) - { - multifabCopyPush(*smf[0], _lIdx, dcomp, scomp, ncomp, _mf.nGrow(), 0); - } - else if (smf.size() == 2) - { - const Box& bx = validbox(mf); - if (mf.boxArray() == smf[0]->boxArray()) - { - int s_idx = smf[0]->IndexArray()[_lIdx]; - int d_idx = mf.IndexArray()[_lIdx]; - FArrayBox& fab= validFab(*_mf); - - fab.linInterp(smf[0]->get(s_idx), - scomp, - smf[1]->get(s_idx), - scomp, - stime[0], - stime[1], - time, - bx, - dcomp, 
- ncomp); - FillBoundaryPush(); - }else{ - int s_idx = smf[0]->IndexArray()[_lIdx]; - int d_idx = dmf->IndexArray()[_lIdx]; - FArrayBox& fab= validFab(*dmf); - fab.linInterp(smf[0]->get(s_idx), - scomp, - smf[1]->get(s_idx), - scomp, - stime[0], - stime[1], - time, - bx, - 0, - ncomp); - //multifabCopyPush(dmf, _lIdx, dcomp, 0, ncomp, _mf.nGrow(), 0); - } - } - //physbcf.FillBoundary(mf, dcomp, ncomp, time); - } - - void FillPatchTwoLevelsPush (Real time, - Vector& cmf, const Vector& ct, - Vector& fmf, const Vector& ft, - int scomp, int dcomp, int ncomp, - const Geometry& cgeom, const Geometry& fgeom, - PhysBCFunctBase& cbc, PhysBCFunctBase& fbc, - const IntVect& ratio, - Interpolater* mapper, const Vector& bcs) - { - - - - } - - - void InitAmrTask (const void* amr, int m_step, Real st_time){ - assert(_amr); - TaskName name= MyName(); - _taskState= name[0]==0?_coarseTimeStep:_timeStep; - _amr= (Amr*)amr; - max_step= m_step; - stop_time= st_time; - cumtime= _amr->cumtime; - dt_level.resize(_amr->finest_level+1); - dt_min.resize(_amr->finest_level+1); - level_steps.resize(_amr->finest_level+1); - level_count.resize(_amr->finest_level+1); - for (int i = 0; i <= _amr->finest_level; i++){ - dt_level[i] = _amr->dtLevel(i); - dt_min[i] = _amr->dt_min[i]; - level_steps[i] = _amr->level_steps[i]; - level_count[i] = _amr->level_count[i]; - } - which_level_being_advanced= _amr->which_level_being_advanced; - sub_cycle= _amr->sub_cycle; - subcycling_iteration =0; - parent_subcycling_iteration=0; - if(name[0]<_amr->finest_level){ - MultiFab& mfSrc = _amr->amr_level[name[0]]->get_new_data(0); - MultiFab& mfDst = _amr->amr_level[name[0]+1]->get_new_data(0); - const BoxArray& fine_BA = mfDst.boxArray(); - BoxArray crse_S_fine_BA = fine_BA; - crse_S_fine_BA.coarsen(_amr->refRatio(1)); - MultiFab *crse_S_fine = new MultiFab(crse_S_fine_BA, mfDst.DistributionMap(), mfDst.nComp(),0); - TheCPC_sendup= (amrex::FabArrayBase::CPC*)&(crse_S_fine->getCPC(IntVect::TheZeroVector(),, - mfSrc, - IntVect::TheZeroVector(), - Periodicity::NonPeriodic())); - } - if(name[0]>0){ - MultiFab& mfSrc1 = _amr->amr_level[name[0]-1]->get_new_data(0); - MultiFab& mfDst1 = _amr->amr_level[name[0]]->get_new_data(0); - const BoxArray& fine_BA = mfDst1.boxArray(); - BoxArray crse_S_fine_BA = fine_BA; - crse_S_fine_BA.coarsen(_amr->refRatio(1)); - MultiFab *crse_S_fine = new MultiFab(crse_S_fine_BA, mfDst1.DistributionMap(), mfDst1.nComp(),0); - TheCPC_pullup= (amrex::FabArrayBase::CPC*)&(crse_S_fine->getCPC(IntVect::TheZeroVector(), - mfSrc1, - IntVect::TheZeroVector(), - Periodicity::NonPeriodic())); - } - } - void CreateLevelTask(int level){ - TaskName name= MyName(); - levelTask= new AmrLevelTask(this, level); - nStates= _amr->amr_level[level]->numStates(); - state.resize(nStates); - for(int i=0; iamr_level[level]->get_state_data(i)); - } - } - - void Signal(TaskName dest, int tag=0){ - Data* data= new Data(_id, dest, 1); - data->SetTag(tag); - _outputs.push(data); - } - - bool DependSignal(TaskName src, int tag=0){ - bool arrived= Depend_on(src, tag); - if(!arrived) return false; - return true; - } - - void DependSignal_reset(TaskName src, int tag=0){ - Data* msg= _neighbors_in.pop_front(src, tag); - msg->Free(); - } - - void Job(){ - TaskName name= MyName(); - if(name[0]==0){//tasks on the coarsest level - switch(_taskState){ - case _coarseTimeStep: - if ( _amr->okToContinue() && - (levelSteps(0) < max_step || max_step < 0) && - (cumtime < stop_time || stop_time < 0.0) ) - - { - coarseTimeStepTask_init(stop_time); - _taskState= 
_timeStep; - }else{ - //_final: - coarseTimeStepTask_end(stop_time); - delete levelTask; - SelfDestroy(); - break; - } - case _timeStep: - timeStepTask_init(0,cumtime,1,1,stop_time); - amr_level= &originalAmrLevel(name[0]); - advanceTask_init(cumtime, dt_level[0], 1, stop_time); - cout<<"Task (Level) " <finest_level >0) - { - const int nloc_cpAsc = TheCPC_sendup->m_LocTags->size(); - for(int i=0; im_LocTags)[i]; - if(name[2] == tag.srcIndex){ - Signal(TaskName(name[0]+1, name[1], tag.dstIndex, name[3]*_amr->n_cycle[1]), 0); - } - } - } - _taskState= _timeStep_advance; - break; - case _timeStep_advance: - if(advanceTask()) - { - dt_new= post_advanceTask(); - _taskState= _post_timeStep; - if (_amr->finest_level >0) - { - for(int d=name[3]*_amr->n_cycle[1]+1; d< (name[3]+1)*_amr->n_cycle[1]; d++){ - const int nloc_cpAsc = TheCPC_sendup->m_LocTags->size(); - for(int i=0; im_LocTags)[i]; - if(name[2] == tag.srcIndex){ - Signal(TaskName(name[0]+1, name[1], tag.dstIndex, d), 0); - } - } - } - } - }else{ - _taskState= _timeStep_advance; - } - break; - case _post_timeStep: - dt_level[0] = dt_new; - level_steps[0]++; - level_count[0]++; - post_timestepTask(1); - //enable next advance iteration if any - if((name[3]+1)%_amr->n_cycle[0]!=0) Signal(TaskName(name[0], name[1],name[2], name[3]+1), 0); - _taskState= _post_coarseTimeStep; - break; - case _post_coarseTimeStep: - //_amr->amr_level[0]->postCoarseTimeStep(cumtime); - cumtime += dt_level[0]; - _taskState= _coarseTimeStep; - break; - default: - cout<<"Error state"<finest_level){ - int lev= name[0]; - switch(_taskState){ - case _timeStep: - cout<<"Task (Level) " <n_cycle[lev], stop_time); - if (lev < _amr->finest_level) - { - const int nloc_cpAsc = TheCPC_sendup->m_LocTags->size(); - for(int i=0; im_LocTags)[i]; - if(name[2] == tag.srcIndex){ - Signal(TaskName(name[0]+1, name[1], tag.dstIndex, name[3]*_amr->n_cycle[lev+1]), 0); - } - } - } - _taskState= _timeStep_advance; - //advanceObj= new advanceTask(cumtime+ (subcycling_iteration-1)*dt_level[lev], dt_level[lev], subcycling_iteration, _amr->n_cycle[lev]); - case _timeStep_advance: - if(advanceTask()) - { - dt_new= post_advanceTask(); - _taskState= _post_timeStep; - if (lev < _amr->finest_level) - { - for(int d=name[3]*_amr->n_cycle[lev+1]+1; d< (name[3]+1)*_amr->n_cycle[lev+1]; d++){ - const int nloc_cpAsc = TheCPC_sendup->m_LocTags->size(); - for(int i=0; im_LocTags)[i]; - if(name[2] == tag.srcIndex){ - Signal(TaskName(name[0]+1, name[1], tag.dstIndex, d), 0); - } - } - } - } - }else{ - _taskState= _timeStep_advance; - //if(name[3]<_amr->n_cycle[lev]-1) Signal(TaskName(name[0], name[1],name[2], name[3]+1), 0); - } - break; - //dt_new= advanceTask(cumtime+ (subcycling_iteration-1)*dt_level[lev], dt_level[lev], subcycling_iteration, _amr->n_cycle[lev]); - //if(advance->state()!=advance->finalState()){ - // delete advanceObj; - // break; //keep doing advance - //} - //_taskState= _post_timeStep; - case _post_timeStep: - cumtime += dt_level[lev]; - dt_level[lev] = dt_new; - level_steps[lev]++; - level_count[lev]++; - post_timestepTask(lev); - if((name[3]+1)%_amr->n_cycle[lev]==0) { - //now we already synced all subcycling iteration before and at lower AMR levels, it's time to enable the parent to move on - const int nloc_cpAsc = TheCPC_pullup->m_LocTags->size(); - for(int i=0; im_LocTags)[i]; - if(name[2] == tag.dstIndex){ - Signal(TaskName(lev-1, name[1], tag.srcIndex, name[3]/_amr->n_cycle[lev]), 0); - } - } - }else{ - //enable next subcycling iteration if any - Signal(TaskName(name[0], 
name[1],name[2], name[3]+1), 0); - } - SelfDestroy(); - delete levelTask; - break; - //_amr->amr_level[lev]->postTimeStep(cumtime); - default: - cout<<"Error state"<0 && name[0]<=_amr->finest_level){ //execute advance - TaskName parentName(name); - int tag=0; - Data* msg= _neighbors_in.pop_front(TaskName(parentName), tag); - char* pos; - Real time= ((Real*)msg)[0]; - Real dt= ((Real*)msg)[1]; - pos= sizeof(Real)*2; - int iteration= ((int*)pos)[0]; - int ncycle= ((int*)pos)[1]; - advanceTask(time, dt, iteration, ncycle); - cout<<"task "<n_cycle[my_level] !=0){//depend on previous subcycling iteration and the parent - if(DependSignal(TaskName(name[0], name[1], name[2], name[3]-1))==false) return false; - //check if the signal from parent arrived - const int nloc_cpAsc = TheCPC_pullup->m_LocTags->size(); - for(int i=0; im_LocTags)[i]; - if(name[2] == tag.dstIndex){ - if(DependSignal(TaskName(my_level-1, name[1], tag.srcIndex, name[3]/_amr->n_cycle[my_level]))==false) return false; - } - } - //all messages arrived, consume them now - DependSignal_reset(TaskName(name[0], name[1], name[2], name[3]-1)); - for(int i=0; im_LocTags)[i]; - if(name[2] == tag.dstIndex){ - DependSignal_reset(TaskName(my_level-1, name[1], tag.srcIndex, name[3]/_amr->n_cycle[my_level])); - } - } - return true; - } - //waiting for signals from tasks at the coarser level - const int nloc_cpAsc = TheCPC_pullup->m_LocTags->size(); - const int nsnds_cpAsc = TheCPC_pullup->m_SndTags->size(); - const int nrcvs_cpAsc = TheCPC_pullup->m_RcvTags->size(); - for(int i=0; im_LocTags)[i]; - if(name[2] == tag.dstIndex){ - if(DependSignal(TaskName(my_level-1, name[1], tag.srcIndex, name[3]/_amr->n_cycle[my_level]), 0)==false) return false; - } - } - - //now all signals have arrived - for(int i=0; im_LocTags)[i]; - if(name[2] == tag.dstIndex){ - DependSignal_reset(TaskName(my_level-1, name[1], tag.srcIndex, name[3]/_amr->n_cycle[my_level]), 0); - } - } - return true; - } - case _timeStep_advance: - return advanceTaskDependency(); - case _post_timeStep: - if(my_level == _amr->finest_level) return true; - else{ - //sync with tasks of the last subcycle iteration - const int nloc_cpAsc = TheCPC_sendup->m_LocTags->size(); - for(int i=0; im_LocTags)[i]; - if(name[2] == tag.srcIndex){ - if(DependSignal(TaskName(name[0]+1, name[1], tag.dstIndex, (name[3]+1)*_amr->n_cycle[1]-1), 0)==false) return false; - } - } - - for(int i=0; im_LocTags)[i]; - if(name[2] == tag.srcIndex){ - DependSignal_reset(TaskName(name[0]+1, name[1], tag.dstIndex, (name[3]+1)*_amr->n_cycle[1]-1), 0); - } - } - return true; - } - case _post_coarseTimeStep: - return true; - } - } - - void PostCompletion(){ - } - - //! Return the Fab associated with this task - FArrayBox& validFab(const FabArray &mf){ - return *(mf.m_fabs_v[_lIdx]); - } - //! Return the local index of the Fab associated with this task. It can then be used to locate corresponding Fabs on other multifabs that have the same layout. 
- int localFabIdx(){ - return _lIdx; - } - - void SetFab(FArrayBox* fab){_fab= fab;} - - void SetMF(const FabArray &mf){ - _mf= (FabArray*)&mf; - } - - void SetIdx(int idx){ - _idx=idx; - } - - void SetLocalIdx(int lIdx){_lIdx= lIdx;} - - void enable_tiling(){_do_tiling=true;} - - Box validbox() const{ - return _mf->box(_idx); - } - - Box validbox(const FabArray &mf) const{ - return mf.box(_idx); - } - - void generateTileArray(const IntVect& tileSize){ - IntVect nt_in_fab, tsize, nleft; - int ntiles = 1; - const Box& bx = validbox(); - - for (int d=0; d *_mf; - FArrayBox* _fab; - int _idx; - int _lIdx; - - //! Set the timestep on each level. - void setDtLevelTask (const Vector& dt_lev){ - for (int i = 0; i <= _amr->finest_level; i++) - dt_level[i] = dt_lev[i]; - } - - //! Set the timestep at one level. - void setDtLevelTask (Real dt, int lev){ - dt_level[lev] = dt; - } - - //! Set the dtmin on each level. - void setDtMinTask (const Vector& dt_min_in){ - for (int i = 0; i <= _amr->finest_level; i++) - dt_min[i] = dt_min_in[i]; - } - - /** - * \brief What is "level" in Amr::timeStep? This is only relevant if we are still in Amr::timeStep; - * it is set back to -1 on leaving Amr::timeStep. - */ - int level_being_advancedTask () const { return which_level_being_advanced; } - - int levelSteps (int lev) const { return level_steps[lev]; } - - //! Physical time. - Real cumTimeTask () const { return cumtime; } - - void setCumTimeTask (Real t) {cumtime = t;} - - //! Time step at specified level. - Real dtLevelTask (int level) const { return dt_level[level]; } - - //! Max time step (typically based on physics) at specified level - Real dtMinTask (int level) const { return dt_min[level]; } - - //! Array of time steps at all levels. - const Vector& dtLevelTask () const { return dt_level; } - - void coarseTimeStepTask_init (Real stop_time){ - if (levelSteps(0) > 0) - { - int post_regrid_flag = 0; - _amr->amr_level[0]->computeNewDt(_amr->finest_level, - sub_cycle, - _amr->n_cycle, - _amr->ref_ratio, - _amr->dt_min, - dt_level, - stop_time, - post_regrid_flag); - } - else - { - _amr->amr_level[0]->computeInitialDt(_amr->finest_level, - sub_cycle, - _amr->n_cycle, - _amr->ref_ratio, - dt_level, - stop_time); - } - } - - //postCoarseTimeStepTask(cumtime); - - void coarseTimeStepTask_end(Real stop_time){ - if (verbose > 0) - { - if(isMasterTask()){ - amrex::Print() - << "\nSTEP = " << level_steps[0] - << " TIME = " << cumtime - << " DT = " << dt_level[0] << "\n\n"; - } - } - if (_amr->record_run_info && ParallelDescriptor::IOProcessor()) - { - if(isMasterTask()){ - _amr->runlog << "STEP = " << level_steps[0] - << " TIME = " << cumtime - << " DT = " << dt_level[0] << '\n'; - } - } - if (_amr->record_run_info_terse && ParallelDescriptor::IOProcessor()) - if(isMasterTask()) - _amr->runlog_terse << level_steps[0] << " " << cumtime << " " << dt_level[0] << '\n'; - - int check_test = 0; - - if (_amr->check_per > 0.0) - { - const int num_per_old = (cumtime-_amr->dt_level[0]) / _amr->check_per; - const int num_per_new = (cumtime ) / _amr->check_per; - - if (num_per_old != num_per_new) - { - check_test = 1; - } - } - - int to_stop = 0; - int to_checkpoint = 0; - int to_plot = 0; - if (_amr->message_int > 0 && level_steps[0] % _amr->message_int == 0) { - if(isMasterTask()){ - if (ParallelDescriptor::IOProcessor()) - { - FILE *fp; - if ((fp=fopen("dump_and_continue","r")) != 0) - { - remove("dump_and_continue"); - to_checkpoint = 1; - fclose(fp); - } - else if ((fp=fopen("stop_run","r")) != 0) - { - remove("stop_run"); 
- to_stop = 1; - fclose(fp); - } - else if ((fp=fopen("dump_and_stop","r")) != 0) - { - remove("dump_and_stop"); - to_checkpoint = 1; - to_stop = 1; - fclose(fp); - } - - if ((fp=fopen("plot_and_continue","r")) != 0) - { - remove("plot_and_continue"); - to_plot = 1; - fclose(fp); - } - } - int packed_data[2]; - packed_data[0] = to_stop; - packed_data[1] = to_checkpoint; - ParallelDescriptor::Bcast(packed_data, 2, ParallelDescriptor::IOProcessorNumber()); - to_stop = packed_data[0]; - to_checkpoint = packed_data[1]; - if(to_stop == 1 && to_checkpoint == 0) { // prevent main from writing files - _amr->last_checkpoint = level_steps[0]; - _amr->last_plotfile = level_steps[0]; - } - - if (to_checkpoint && _amr->write_plotfile_with_checkpoint) - to_plot = 1; - - if ((_amr->check_int > 0 && level_steps[0] % _amr->check_int == 0) || check_test == 1 - || to_checkpoint) - { - _amr->checkPoint(); - } - - if (_amr->writePlotNow() || to_plot) - { - _amr->writePlotFile(); - } - - if (_amr->writeSmallPlotNow()) - { - _amr->writeSmallPlotFile(); - } - _amr->bUserStopRequest = to_stop; - if (to_stop) - { - ParallelDescriptor::Barrier("Amr::coarseTimeStep::to_stop"); - if(ParallelDescriptor::IOProcessor()) { - if (to_checkpoint) - { - std::cerr << "Stopped by user w/ checkpoint" << std::endl; - } - else - { - std::cerr << "Stopped by user w/o checkpoint" << std::endl; - } - } - } - } - } - } - - virtual void advanceTask_init (Real time, Real dt, int iteration, int ncycle) = 0; - virtual bool advanceTask ()=0; - virtual bool advanceTaskDependency (){return true;} - virtual Real post_advanceTask()=0; - - void timeStepTask_init (int level, Real time, int iteration, int niter, Real stop_time){ - which_level_being_advanced = level; - int lev_top = std::min(_amr->finest_level, _amr->max_level-1); - - for (int i(level); i <= lev_top; ++i) - { - const int old_finest = _amr->finest_level; - - if (_amr->okToRegrid(i)) - { - _amr->regrid(i,time); - if (compute_new_dt_on_regrid && (i == 0) ) - { - int post_regrid_flag = 1; - _amr->amr_level[0]->computeNewDt(_amr->finest_level, - sub_cycle, - _amr->n_cycle, - _amr->ref_ratio, - dt_min, - dt_level, - stop_time, - post_regrid_flag); - } - for (int k(i); k <= _amr->finest_level; ++k) { - level_count[k] = 0; - } - if (old_finest < _amr->finest_level) - { - // The new levels will not have valid time steps - // and iteration counts. - for (int k(old_finest + 1); k <= _amr->finest_level; ++k) - { - dt_level[k] = dt_level[k-1]/_amr->n_cycle[k]; - } - } - } - if (old_finest > _amr->finest_level) { - lev_top = std::min(_amr->finest_level, _amr->max_level - 1); - } - } - } - - // Real dt_new = advanceTask(time,dt_level[level],iteration,niter); - -#if 0 - void _postTimeStepTask(int level, Real time, int iteration, int niter, Real stop_time){ - dt_min[level] = iteration == 1 ? dt_new : std::min(dt_min[level],dt_new); - level_steps[level]++; - level_count[level]++; - if (verbose > 0) - { - amrex::Print() << "[Level " << level << " step " << level_steps[level] << "] " - << "Advanced " << _amr->amr_level[level]->countCells() << " cells\n"; - } - - // If the level signified that it wants a regrid after the advance has - // occurred, do that now. - if (_amr->amr_level[level]->postStepRegrid()) { - - int old_finest = _amr->finest_level; - - _amr->regrid(level, time); - - if (old_finest < _amr->finest_level) - { - // The new levels will not have valid time steps. 
- for (int k = old_finest + 1; k <= _amr->finest_level; ++k) - { - dt_level[k] = dt_level[k-1] / _amr->n_cycle[k]; - } - } - } - - //signal timeStepTask at the next level - if (level < _amr->finest_level) - { - const int lev_fine = level+1; - - if (_amr->sub_cycle) - { - const int ncycle = _amr->n_cycle[lev_fine]; - - for (int i = 1; i <= ncycle; i++) - timeStepTask(lev_fine,time+(i-1)*dt_level[lev_fine],i,ncycle,stop_time); - } - else - { - timeStepTask(lev_fine,time,1,1,stop_time); - } - } - - //_amr->amr_level[level]->post_timestep(iteration); - - // Set this back to negative so we know whether we are in fact in this routine - which_level_being_advanced = -1; - }//end timeStep -#endif - - virtual void post_timestepTask(int iteration)=0; - private: - amrex::FabArrayBase::CPC *TheCPC_sendup; - amrex::FabArrayBase::CPC *TheCPC_pullup; - amrex::FabArrayBase::CPC *TheCPC_senddown; - amrex::FabArrayBase::CPC *TheCPC_pulldown; - - protected: - int subcycling_iteration; - int parent_subcycling_iteration; - int _taskState; - // The data that need to be privatized - Real cumtime; // Physical time variable. - Real dt_new; - Vector dt_level; // Timestep at this level. - Vector dt_min; - Vector level_count; - Vector level_steps; // Number of time steps at this level. - int which_level_being_advanced; // Only >=0 if we are in Amr::timeStep(level,...) - int sub_cycle; - - //for an AMR level - AmrLevel *amr_level; - AmrLevelTask *levelTask; - int nStates; - Vector state; // Array of state data. - MultiFab& get_old_data (int state_indx) { return state[state_indx].oldDataTask(); } - MultiFab& get_new_data (int state_indx) { return state[state_indx].newDataTask(); } - }; -}//end namespace -#endif /*_Amr_H_*/ diff --git a/Src/AmrTask/AMFIter/AMReX_AsyncMFIter.H b/Src/AmrTask/AMFIter/AMReX_AsyncMFIter.H deleted file mode 100644 index 216d9d0aadd..00000000000 --- a/Src/AmrTask/AMFIter/AMReX_AsyncMFIter.H +++ /dev/null @@ -1,594 +0,0 @@ -#ifndef AMREX_ASYNC_MFITER -#define AMREX_ASYNC_MFITER -//Question? 
email tannguyen@lbl.gov -//Created 09-07-2017 -//Last modification 09-07-2017 - -#include "AMReX_AbstractTask.H" -#include "AMReX_TaskGraph.H" -#include "RTS.H" -#include -#include -#include -#include -#include "AMReX_Connections.H" -#include -#include - -//#ifdef _OPENMP -#include -//#endif - -namespace amrex { - typedef MFIter LocalFabIdx; - class Action :public Task{ - protected: - LocalConnection l_con; - RemoteConnection r_con; - struct TileArray - { - Vector numLocalTiles; - Vector localTileIndexMap; - Vector tileArray; - } ta; - bool _do_tiling; - int current_tile; - - size_t tagGen(int src, int dest, int amrlevels, int fabs) - { - return (src*fabs + dest%fabs)*amrlevels; - } - void FillBoundary_Push(){ - for(int i=0; iSetTag(i); //this is local copy so the recipient will have the matching tag - msg->SetDestRank(ParallelDescriptor::MyProc()); - _fab->copyToMem(l_con.scpy[i].sbx, 0, _mf->nComp(), msg->GetBuffer()); //pack box to the message - _outputs.push(msg);//let the runtime know that the output is available - } - int np = ParallelDescriptor::NProcs(); - if (np==1) return; - for(int i=0; iSetTag(tagGen(r_con.snd[i].ns, r_con.snd[i].nd, 1, _mf->size())); - msg->SetDestRank(r_con.snd[i].pr); - _fab->copyToMem(r_con.snd[i].sbx, 0, _mf->nComp(), msg->GetBuffer()); - _outputs.push(msg); - } - } - void FillBoundary_Pull(){ - for(int i=0; icopyFromMem(l_con.dcpy[i].dbx,0, _mf->nComp(), msg->GetBuffer());//unpack message to box - msg->Free(); - } - int np = ParallelDescriptor::NProcs(); - if (np==1) return; - for(int i=0; isize()); - Data* msg= _neighbors_in.pop_front(TaskName(r_con.rcv[i].ns), tag); - _fab->copyFromMem(r_con.rcv[i].dbx, 0, _mf->nComp(), msg->GetBuffer()); - msg->Free(); - } - } - bool isSatisfied(){ - if(!DependSignal()) return false; //wait for dependent signal if ANY - bool satisfied=true; - for(int i=0; isize())); - if(!satisfied) return false; - } - return true; - } - void extendIters(int extra){_nIters+= extra;} - int _iter, _nIters; - FabArray *_mf; - FArrayBox* _fab; - int _idx; - int _lIdx; - bool _communicateFirstTimeStep; //exchange ghost cells before starting the first time step - bool _communicateUponCompletion; //exchange ghost cells after computing the last time step - public: - LocalConnection& LCon(){return l_con;} - RemoteConnection& RCon(){return r_con;} - Action(){ - _iter=-1; - _nIters=1; - _communicateFirstTimeStep=true; //the default is we exchange ghost cells before the first time step - _communicateUponCompletion=false; - _do_tiling=false; - } - ~Action(){ - free(l_con.scpy); - free(l_con.dcpy); - free(r_con.snd); - free(r_con.rcv); - } - void enable_tiling(){_do_tiling=true;} - vector& getTileArray(){return ta.tileArray;} - void SetFab(FArrayBox* fab){_fab= fab;} - void SetSteps(int nIters){ - assert(nIters>=1); - _nIters= nIters; - } - void SetMF(const FabArray &mf){ - _mf= (FabArray*)&mf; - } - void SetIdx(int idx){ - _idx=idx; - } - void SetLocalIdx(int lIdx){_lIdx= lIdx;} - virtual void Compute(Box)=0; - virtual void Init(){}; - virtual bool DependSignal(){return true;} - - void tileIndices(int &beginIndex, int &endIndex){ -#ifdef _OPENMP - int tid = omp_get_thread_num(); - int nthreads= omp_get_num_threads(); - int ntot= ta.tileArray.size(); - int nr = ntot / nthreads; - int nlft = ntot - nr * nthreads; - if (tid < nlft) { // get nr+1 items - beginIndex += tid * (nr + 1); - endIndex = beginIndex + nr + 1; - } else { // get nr items - beginIndex += tid * nr + nlft; - endIndex = beginIndex + nr; - } -#else - beginIndex=0; - endIndex= 
ta.tileArray.size(); -#endif - } - void Job(){ - if(_communicateFirstTimeStep){ - if(_iter==-1) FillBoundary_Push(); - else if (_iter==0){ - FillBoundary_Pull(); - } - }else if(_iter==-1) _iter++; //go directly to the first compute step - if(_iter>=0 && _iter<_nIters){ //always compute from time step 0 to _nIters-1 - if(_iter>0)FillBoundary_Pull(); //communication at step 0 is already governed by _communicateFirstTimeStep - if(!_do_tiling) Compute(validbox());//execute task at Fab level - else{ -#ifdef _OPENMP -#pragma omp parallel - { -#endif - int beginIndex, endIndex; - tileIndices(beginIndex, endIndex); - for(int tile=beginIndex; tilebox(_idx); - } - //! Return the Fab associated with this task - FArrayBox& validFab(){ - return *(_mf->m_fabs_v[_lIdx]); - } - //! Return the local index of the Fab associated with this task. It can then be used to locate corresponding Fabs on other multifabs that have the same layout. - int localFabIdx(){ - return _lIdx; - } - //! Locate in multifab mf the Fab that has the same coordinate as this task' Fab - FArrayBox& validFab(const FabArray &mf){ - return *(mf.m_fabs_v[_lIdx]); - } - //! Locate in multifab mf the Fab that has local index lIdx - FArrayBox& validFab(const FabArray &mf, int lIdx){ - return *(mf.m_fabs_v[lIdx]); - } - - void generateTileArray(const IntVect& tileSize){ - IntVect nt_in_fab, tsize, nleft; - int ntiles = 1; - const Box& bx = validbox(); - - for (int d=0; dm_fabs_v[_lIdx]->box(); - for (int d=0; d - class MFGraph: public AbstractTaskGraph{ - protected: - string _graphName; - bool _do_tiling; - public: - MFGraph(const FabArray &mf, int nSteps, int rank, int nProcs, Periodicity period, bool do_tiling){ - AbstractTaskGraph::_nProcs= nProcs; - AbstractTaskGraph::_rank= rank; - for(int i=0; i< mf.local_size(); i++){ - TaskName name(mf.IndexArray()[i]); - T *t= new T(); - t->SetSteps(nSteps); - t->SetMF(mf); - t->SetFab(mf.m_fabs_v[i]); - t->SetIdx(mf.IndexArray()[i]); - t->SetName(name); - t->SetLocalIdx(i); - if(do_tiling){ - IntVect ts= FabArrayBase::mfiter_tile_size; - t->generateTileArray(ts); //create tile array associated with this FAB - } - t->Init(); - if(do_tiling) t->enable_tiling(); - AbstractTaskGraph::_initialTasks.push_back(t); - AbstractTaskGraph::_taskPool[name]= t; - } - AbstractTaskGraph::_begin= *(AbstractTaskGraph::_initialTasks.begin()); - AbstractTaskGraph::_end= *(AbstractTaskGraph::_initialTasks.end()); - AbstractTaskGraph::_currIt= AbstractTaskGraph::_initialTasks.begin(); - AbstractTaskGraph::_current= *(AbstractTaskGraph::_currIt); - AbstractTaskGraph::_mode= _Push; - SetupFabConnections(mf, period); - _do_tiling= do_tiling; - } - - MFGraph(const Amr* amr, int max_step, Real stop_time, int rank, int nProcs, bool do_tiling){ - AbstractTaskGraph::_nProcs= nProcs; - AbstractTaskGraph::_rank= rank; - //create an initial graph corresponding to the coarsest AMR level, this graph will evolve with time - int n_intervals=1; - for(int l=0; l<= amr->finest_level; l++){ - n_intervals*= amr->n_cycle[l]; - for(int s=0; s< amr->amr_level[l]->numStates(); s++){ - MultiFab& mf = amr->amr_level[l]->get_new_data(s); - amr->amr_level[l]->get_state_data(s).allocOldData(); - for(int i=0; i< mf.local_size(); i++){ - for(int it=0; it< n_intervals; it++){ - TaskName name(l /*level*/, s/*state*/, mf.IndexArray()[i] /*fab*/, it); - T *t= new T(); - t->SetName(name); - t->SetLocalIdx(i); - t->SetMF(mf); - t->SetFab(mf.m_fabs_v[i]); - t->SetIdx(mf.IndexArray()[i]); - t->InitAmrTask(amr, max_step, stop_time); - t->CreateLevelTask(l); - 
if(i==0) t->SetMaster(); - if(do_tiling){ - IntVect ts= FabArrayBase::mfiter_tile_size; - t->generateTileArray(ts); //create tile array associated with this FAB - } - if(do_tiling) t->enable_tiling(); - AbstractTaskGraph::_initialTasks.push_back(t); - AbstractTaskGraph::_taskPool[name]= t; - SetupFabConnections(mf, amr->amr_level[l]->Geom().periodicity()); - } - } - } - } - AbstractTaskGraph::_begin= *(AbstractTaskGraph::_initialTasks.begin()); - AbstractTaskGraph::_end= *(AbstractTaskGraph::_initialTasks.end()); - AbstractTaskGraph::_currIt= AbstractTaskGraph::_initialTasks.begin(); - AbstractTaskGraph::_current= *(AbstractTaskGraph::_currIt); - AbstractTaskGraph::_mode= _Push; - _do_tiling= do_tiling; - } - - int FindProcessAssociation(TaskName name){ - assert(false); - } - void SetupFabConnections(const FabArray &mf, Periodicity period){ - int np = ParallelDescriptor::NProcs(); - int myProc = ParallelDescriptor::MyProc(); - int numfabs = mf.size(); - bool cross = false; - const FabArrayBase::FB& TheFB = mf.getFB(mf.nGrowVect(),period); - const int n_loc_mf = TheFB.m_LocTags->size(); - const int n_snds_mf = TheFB.m_SndTags->size(); - const int n_rcvs_mf = TheFB.m_RcvTags->size(); - Vector send_cctc; - Vector send_pr; - send_cctc.reserve(n_snds_mf); - - for (FabArrayBase::MapOfCopyComTagContainers::const_iterator m_it = TheFB.m_SndTags->begin(), - m_End = TheFB.m_SndTags->end(); - m_it != m_End; - ++m_it) - { - if(m_it->first != myProc) // Not destined to me. - { - send_pr.push_back(m_it->first); - send_cctc.push_back(&(m_it->second)); - } - } - Vector recv_cctc; - Vector recv_pr; - recv_cctc.reserve(n_rcvs_mf); - - for (FabArrayBase::MapOfCopyComTagContainers::const_iterator m_it = TheFB.m_RcvTags->begin(), - m_End = TheFB.m_RcvTags->end(); - m_it != m_End; - ++m_it) - { - if(m_it->first != myProc) // I am not the source for this receipt - { - recv_pr.push_back(m_it->first); - recv_cctc.push_back(&(m_it->second)); - } - } - for(int f=0; f::_initialTasks[f])->LCon(); - l_con.nscpy = 0; - l_con.ndcpy = 0; - l_con.firingRuleCnt = 0; - for(int i=0; i 1) - { - for(int f=0; f::_initialTasks[f])->RCon(); - r_con.nrcv = 0; - r_con.nsnd = 0; - r_con.firingRuleCnt = 0; - for(int i=0; isrcIndex) - r_con.nsnd++; - } - } - for(int i=0; idstIndex) - r_con.nrcv++; - } - } - } - } - int scnt, dcnt; - for(int f=0; f::_initialTasks[f])->LCon(); - l_con.scpy = new LocalCopyDescriptor[l_con.nscpy]; - l_con.dcpy = new LocalCopyDescriptor[l_con.ndcpy]; - for(int i=0; i::_initialTasks[f])->LCon(); - for(int i=0; i::_initialTasks[l_con.scpy[i].nd])->LCon(); - for(int j=0; j::_initialTasks[l_con.dcpy[i].ns])->LCon(); - for(int j=0; j::_initialTasks[f])->RCon(); - r_con.snd = new RemoteCommDescriptor[r_con.nsnd]; - r_con.rcv = new RemoteCommDescriptor[r_con.nrcv]; - nrcv= -1; - for(int i=0; idstIndex) - { - nrcv++; - r_con.rcv[nrcv].ns = it->srcIndex; - r_con.rcv[nrcv].lns = -1; - r_con.rcv[nrcv].nd = it->dstIndex; - r_con.rcv[nrcv].lnd = mf.localindex(it->dstIndex); - r_con.rcv[nrcv].sbx = it->sbox; - r_con.rcv[nrcv].dbx = it->dbox; - r_con.rcv[nrcv].pr = pr; - r_con.rcv[nrcv].cnt = 0; - r_con.rcv[nrcv].sz = it->sbox.numPts() * mf.nComp() * sizeof(double); - } - } - } - nsnd = -1; - for(int i=0; idstIndex ) - { - nsnd++; - r_con.snd[nsnd].ns = it->srcIndex; - r_con.snd[nsnd].lns = mf.localindex(it->srcIndex); - r_con.snd[nsnd].nd = it->dstIndex; - r_con.snd[nsnd].lnd = -1; - r_con.snd[nsnd].sbx = it->sbox; - r_con.snd[nsnd].dbx = it->dbox; - r_con.snd[nsnd].pr = pr; - r_con.snd[nsnd].cnt = 0; - 
r_con.snd[nsnd].sz = it->dbox.numPts() * mf.nComp() * sizeof(double); - } - } - } // for(i -#define max_life 2^32-1 - class AMFIter{ - private: - RTS rts; - MFGraph *graph; - bool _do_tiling; - public: - AMFIter(const FabArray &mf, int nSteps, Periodicity period, bool do_tiling=false){ - _do_tiling= do_tiling; - graph= new MFGraph(mf, nSteps, ParallelDescriptor::MyProc(), ParallelDescriptor::NProcs(), period, do_tiling); - } - - AMFIter(const FabArray &mf, Periodicity period, bool do_tiling=false){ - _do_tiling= do_tiling; - graph= new MFGraph(mf, max_life, ParallelDescriptor::MyProc(), ParallelDescriptor::NProcs(), period, do_tiling); - } - - AMFIter(const Amr* amr, int max_step, Real stop_time, bool do_tiling=false){ - _do_tiling= do_tiling; - graph= new MFGraph(amr, max_step, stop_time, ParallelDescriptor::MyProc(), ParallelDescriptor::NProcs(), do_tiling); - } - - ~AMFIter(){ - delete graph; - } - - void Iterate(){ - rts.Init(ParallelDescriptor::MyProc(), ParallelDescriptor::NProcs()); - rts.Iterate(graph); - rts.Finalize(); - } - }; -#undef max_life -} //end namespace -#endif diff --git a/Src/AmrTask/AMFIter/AMReX_AsyncMFIter.cpp b/Src/AmrTask/AMFIter/AMReX_AsyncMFIter.cpp deleted file mode 100644 index ebdb948f4d1..00000000000 --- a/Src/AmrTask/AMFIter/AMReX_AsyncMFIter.cpp +++ /dev/null @@ -1,4 +0,0 @@ -#include "AMReX_AsyncMFIter.H" - -namespace amrex { -} diff --git a/Src/AmrTask/AMFIter/AMReX_Connections.H b/Src/AmrTask/AMFIter/AMReX_Connections.H deleted file mode 100644 index e9f6426862a..00000000000 --- a/Src/AmrTask/AMFIter/AMReX_Connections.H +++ /dev/null @@ -1,59 +0,0 @@ -#ifndef AMREX_CONNECTIONS_H -#define AMREX_CONNECTION_H - -#include -#include -#include - -namespace amrex { - - struct LocalCopyDescriptor - { - int ns; // ! Source box in layout - int nd; //! Destination box in layout - Box sbx; // ! Sub-box for this copy - Box dbx; // ! Sub-box for this copy - size_t sz; - int sPartner, dPartner; - int dcpyCnt, scpyCnt; - }; - - struct LocalConnection - { - int nscpy; //! Number of cpy chunks - int ndcpy; //! Number of cpy chunks - int firingRuleCnt; - LocalCopyDescriptor *scpy; - LocalCopyDescriptor *dcpy; - }; - - struct RemoteCommDescriptor - { - int ns, lns; // ! Source box in layout - int nd, lnd; //! Destination box in layout - size_t sz; - int pr; - Box sbx; // ! Sub-box for this copy - Box dbx; // ! 
Sub-box for this copy - int cnt; - }; - - struct TransDescriptor - { - int sz, pv, pr; - }; - - struct RemoteConnection - { - int nsnd; - int nrcv; - int nrp, nsp; - int firingRuleCnt; - RemoteCommDescriptor *snd; - RemoteCommDescriptor *rcv; - TransDescriptor *str; - TransDescriptor *rtr; - }; -}//end namespace -#endif - diff --git a/Src/AmrTask/AMFIter/Makefile b/Src/AmrTask/AMFIter/Makefile deleted file mode 100755 index 5eda141c3f8..00000000000 --- a/Src/AmrTask/AMFIter/Makefile +++ /dev/null @@ -1,25 +0,0 @@ -include ../arch.common - -OBJECTS= AMReX_AsyncMFIter.o - -AMFIterLIB= AMReX_AsyncMFIter.a - -all: $(AMFIterLIB) - -$(AMFIterLIB): $(OBJECTS) - ar rv $(AMFIterLIB) $(OBJECTS) - - -INCLUDE += -DBL_USE_MPI -DBL_USE_OMP -DBL_SPACEDIM=3 -DAMREX_SPACEDIM=3 -DBL_FORT_USE_UNDERSCORE -DBL_Linux - -all: $(OBJECTS) - -AMReX_AsyncMFIter.o: AMReX_AsyncMFIter.cpp AMReX_AsyncMFIter.H - $(C++) $(C++FLAGS) -I./ -I../../Base -I../../Amr -I../../AmrCore -I../graph -I$(INCLUDE) -c AMReX_AsyncMFIter.cpp -o AMReX_AsyncMFIter.o - -.PHONY: clean - -clean: - $(RM) $(OBJECTS) - $(RM) *.a - diff --git a/Src/AmrTask/Amr/AMReX_AmrLevelTask.H b/Src/AmrTask/Amr/AMReX_AmrLevelTask.H deleted file mode 100644 index 9a0d6581337..00000000000 --- a/Src/AmrTask/Amr/AMReX_AmrLevelTask.H +++ /dev/null @@ -1,291 +0,0 @@ -#ifndef AMREX_AmrLevelAsync_H_ -#define AMREX_AmrLevelAsync_H_ - -#include "AMReX_AmrLevel.H" - -namespace amrex { - - class AmrLevelAsync: public AmrLevel - { - public: - friend class AsyncFillPatchIterator; - virtual void initPerilla (Real time) = 0; - virtual void finalizePerilla (Real time) = 0; - }; - - class AsyncFillPatchIterator :public MFIter - { - public: - - friend class AmrLevelAsync; - friend class RGIter; - - AsyncFillPatchIterator (AmrLevel& amrlevel, - MultiFab& leveldata, - int boxGrow, - Real time, - int state_indx, - int scomp, - int ncomp, - int f, - int iter, - int tid); - - void initFillPatch(int boxGrow, - int time, - int index, - int scomp, - int ncomp, - int iter); - static void initialSend(amrex::Vector afpi, - amrex::Vector upper_afpi, - int boxGrow, - Real time, - int state_indx, - int scomp, - int ncomp, - int iter, - int tid); - - void PushOnly (int boxGrow, - Real time, - int state_indx, - int scomp, - int ncomp, - int f, - int tid, - unsigned char pushLevel, - int tf, - bool singleT=false); - - void SendIntraLevel (RGIter& rgi, - int boxGrow, - Real time, - int state_indx, - int scomp, - int ncomp, - int iter, - int f, - int tid, - bool singleT=false); - - void SendIntraLevel (RGIter* rgi, - int boxGrow, - Real time, - int state_indx, - int scomp, - int ncomp, - int iter, - int f, - int tid, - bool singleT=false); - - void SendInterLevel (RGIter& rgi, - int boxGrow, - Real time, - int state_indx, - int scomp, - int ncomp, - int iter, - int f, - int tid, - bool singleT=false); - - void SendInterLevel (RGIter* rgi, - int boxGrow, - Real time, - int state_indx, - int scomp, - int ncomp, - int iter, - int f, - int tid, - bool singleT=false); - - void Receive (RGIter& rgi, - int boxGrow, - Real time, - int state_indx, - int scomp, - int ncomp, - int f, - int tid, - bool singleT=false); - - void Receive (RGIter* rgi, - int boxGrow, - Real time, - int state_indx, - int scomp, - int ncomp, - int f, - int tid, - bool singleT=false); - - void Receive (RGIter& rgi, - MultiFab& dest, - int boxGrow, - Real time, - int state_indx, - int scomp, - int ncomp, - int f, - int tid, - bool singleT=false); - - void Receive (RGIter* rgi, - MultiFab& dest, - int boxGrow, - Real time, - int 
state_indx, - int scomp, - int ncomp, - int f, - int tid, - bool singleT=false); - - void PullOnly (int boxGrow, - Real time, - int state_indx, - int scomp, - int ncomp, - int f, - int tid, - bool singleT=false); - - void PullOnly (MultiFab& dest, - int boxGrow, - Real time, - int state_indx, - int scomp, - int ncomp, - int f, - int tid, - bool singleT=false); - void FillFromTwoLevelsPush (Real time, - int index, - int scomp, - int dcomp, - int ncomp, - int f, - int tid, - unsigned char pushLevel, - int tf, - bool singleT); - void FillFromTwoLevelsPull (Real time, - int index, - int scomp, - int dcomp, - int ncomp, - int f, - int tid, - bool singleT); - - ~AsyncFillPatchIterator (); - - FArrayBox& operator() () { return m_fabs[MFIter::index()]; } - - Box UngrownBox () const { return MFIter::validbox(); } - - MultiFab& get_mf() { return m_fabs; } - AsyncFillPatchIterator (); - AsyncFillPatchIterator (const AsyncFillPatchIterator& rhs); - AsyncFillPatchIterator& operator= (const AsyncFillPatchIterator& rhs); - - AmrLevel& m_amrlevel; - MultiFab& m_leveldata; - std::vector< std::pair > m_range; - MultiFab m_fabs; - int m_ncomp; - - public: - bool isProperlyNested; - - Vector smf; - Vector stime; - StateDataPhysBCFunct* physbcf; - Geometry* geom; - - - Vector smf_crse; - Vector stime_crse; - StateDataPhysBCFunct* physbcf_crse; - Geometry* geom_crse; - - Vector smf_fine; - Vector stime_fine; - StateDataPhysBCFunct* physbcf_fine; - Geometry* geom_fine; - - - RegionGraph* destGraph; - RegionGraph* csrcGraph; - RegionGraph* fsrcGraph; - - MultiFab* m_mf_crse_patch; - RegionGraph* m_rg_crse_patch; - const FabArrayBase::FPinfo* m_fpc; - - //PArray raii; - MultiFab* dmf; - MultiFab* dmff; - - void completeRegionGraphs(int tg) - { - //std::cout << "Completing RGs "; - - if(destGraph != NULL) - { - //std::cout << destGraph->graphID << " "; - destGraph->completeRegionGraph(tg); - } - if(csrcGraph != NULL) - { - //std::cout << csrcGraph->graphID << " "; - csrcGraph->completeRegionGraph(tg); - } - if(fsrcGraph != NULL) - { - //std::cout << fsrcGraph->graphID << " "; - fsrcGraph->completeRegionGraph(tg); - } - if(m_rg_crse_patch != NULL) - { - //std::cout << m_rg_crse_patch->graphID << " "; - m_rg_crse_patch->completeRegionGraph(tg); - } - - //std::cout <<" by tg " << tg << std::endl; - } - void Reset(int tg) - { - //std::cout << "Resetting RGs "; - if(destGraph != NULL) - { - //std::cout << destGraph->graphID << " "; - destGraph->Reset(tg); - } - if(csrcGraph != NULL) - { - //std::cout << csrcGraph->graphID << " "; - csrcGraph->Reset(tg); - } - if(fsrcGraph != NULL) - { - //std::cout << fsrcGraph->graphID << " "; - fsrcGraph->Reset(tg); - } - if(m_rg_crse_patch != NULL) - { - //std::cout << m_rg_crse_patch->graphID << " "; - m_rg_crse_patch->Reset(tg); - } - //std::cout <<" by tg " << tg << std::endl; - } - - // Variables for optimization calls of two level push/pulll - - }; - - -#endif diff --git a/Src/AmrTask/Amr/AMReX_AmrLevelTask.cpp b/Src/AmrTask/Amr/AMReX_AmrLevelTask.cpp deleted file mode 100644 index 4f8cda112c4..00000000000 --- a/Src/AmrTask/Amr/AMReX_AmrLevelTask.cpp +++ /dev/null @@ -1,2075 +0,0 @@ - -#include - -#include -#include - -#include -#include -#include -#include -#include -#include -#include -#include -#include -#include - -#ifdef AMREX_USE_EB -#include -#include -#endif - -namespace amrex { - -#ifdef AMREX_USE_EB -int AmrLevel::m_eb_basic_grow_cells = 5; -int AmrLevel::m_eb_volume_grow_cells = 4; -int AmrLevel::m_eb_full_grow_cells = 2; -EBSupport AmrLevel::m_eb_support_level = 
EBSupport::volume; -#endif - -DescriptorList AmrLevel::desc_lst; -DeriveList AmrLevel::derive_lst; - -void -AmrLevel::postCoarseTimeStep (Real time) -{ - BL_ASSERT(level == 0); - // sync up statedata time - for (int lev = 0; lev <= parent->finestLevel(); ++lev) { - AmrLevel& amrlevel = parent->getLevel(lev); - for (int i = 0; i < amrlevel.state.size(); ++i) { - amrlevel.state[i].syncNewTimeLevel(time); - } - } -} - -void -AmrLevel::set_preferred_boundary_values (MultiFab& S, - int state_index, - int scomp, - int dcomp, - int ncomp, - Real time) const -{} - -DeriveList& -AmrLevel::get_derive_lst () -{ - return derive_lst; -} - -void -AmrLevel::manual_tags_placement (TagBoxArray& tags, - const Vector& bf_lev) -{} - -AmrLevel::AmrLevel () -{ - parent = 0; - level = -1; -} - -AmrLevel::AmrLevel (Amr& papa, - int lev, - const Geometry& level_geom, - const BoxArray& ba, - const DistributionMapping& dm, - Real time) - : - geom(level_geom), - grids(ba), - dmap(dm) -{ - BL_PROFILE("AmrLevel::AmrLevel(dm)"); - level = lev; - parent = &papa; - - fine_ratio = IntVect::TheUnitVector(); fine_ratio.scale(-1); - crse_ratio = IntVect::TheUnitVector(); crse_ratio.scale(-1); - - if (level > 0) - { - crse_ratio = parent->refRatio(level-1); - } - if (level < parent->maxLevel()) - { - fine_ratio = parent->refRatio(level); - } - - state.resize(desc_lst.size()); - -#ifdef AMREX_USE_EB - m_factory.reset(new EBFArrayBoxFactory(geom, ba, dm, - {m_eb_basic_grow_cells, m_eb_volume_grow_cells, m_eb_full_grow_cells}, - m_eb_support_level)); -#else - m_factory.reset(new FArrayBoxFactory()); -#endif - - // Note that this creates a distribution map associated with grids. - for (int i = 0; i < state.size(); i++) - { - state[i].define(geom.Domain(), - grids, - dm, - desc_lst[i], - time, - parent->dtLevel(lev), - *m_factory); - } - - if (parent->useFixedCoarseGrids()) constructAreaNotToTag(); - - post_step_regrid = 0; - - finishConstructor(); -} - -void -AmrLevel::writePlotFile (const std::string& dir, - std::ostream& os, - VisMF::How how) -{ - int i, n; - // - // The list of indices of State to write to plotfile. - // first component of pair is state_type, - // second component of pair is component # within the state_type - // - std::vector > plot_var_map; - for (int typ = 0; typ < desc_lst.size(); typ++) - for (int comp = 0; comp < desc_lst[typ].nComp();comp++) - if (parent->isStatePlotVar(desc_lst[typ].name(comp)) && - desc_lst[typ].getType() == IndexType::TheCellType()) - plot_var_map.push_back(std::pair(typ,comp)); - - int n_data_items = plot_var_map.size(); - - // get the time from the first State_Type - // if the State_Type is ::Interval, this will get t^{n+1/2} instead of t^n - Real cur_time = state[0].curTime(); - - if (level == 0 && ParallelDescriptor::IOProcessor()) - { - // - // The first thing we write out is the plotfile type. 
- // - os << thePlotFileType() << '\n'; - - if (n_data_items == 0) - amrex::Error("Must specify at least one valid data item to plot"); - - os << n_data_items << '\n'; - - // - // Names of variables - // - for (i =0; i < static_cast(plot_var_map.size()); i++) - { - int typ = plot_var_map[i].first; - int comp = plot_var_map[i].second; - os << desc_lst[typ].name(comp) << '\n'; - } - - os << BL_SPACEDIM << '\n'; - os << parent->cumTime() << '\n'; - int f_lev = parent->finestLevel(); - os << f_lev << '\n'; - for (i = 0; i < BL_SPACEDIM; i++) - os << Geom().ProbLo(i) << ' '; - os << '\n'; - for (i = 0; i < BL_SPACEDIM; i++) - os << Geom().ProbHi(i) << ' '; - os << '\n'; - for (i = 0; i < f_lev; i++) - os << parent->refRatio(i)[0] << ' '; - os << '\n'; - for (i = 0; i <= f_lev; i++) - os << parent->Geom(i).Domain() << ' '; - os << '\n'; - for (i = 0; i <= f_lev; i++) - os << parent->levelSteps(i) << ' '; - os << '\n'; - for (i = 0; i <= f_lev; i++) - { - for (int k = 0; k < BL_SPACEDIM; k++) - os << parent->Geom(i).CellSize()[k] << ' '; - os << '\n'; - } - os << (int) Geom().Coord() << '\n'; - os << "0\n"; // Write bndry data. - - } - // Build the directory to hold the MultiFab at this level. - // The name is relative to the directory containing the Header file. - // - static const std::string BaseName = "/Cell"; - char buf[64]; - sprintf(buf, "Level_%d", level); - std::string sLevel = buf; - // - // Now for the full pathname of that directory. - // - std::string FullPath = dir; - if (!FullPath.empty() && FullPath[FullPath.size()-1] != '/') - FullPath += '/'; - FullPath += sLevel; - // - // Only the I/O processor makes the directory if it doesn't already exist. - // - if (ParallelDescriptor::IOProcessor()) - if (!amrex::UtilCreateDirectory(FullPath, 0755)) - amrex::CreateDirectoryFailed(FullPath); - // - // Force other processors to wait till directory is built. - // - ParallelDescriptor::Barrier(); - - if (ParallelDescriptor::IOProcessor()) - { - os << level << ' ' << grids.size() << ' ' << cur_time << '\n'; - os << parent->levelSteps(level) << '\n'; - - for (i = 0; i < grids.size(); ++i) - { - RealBox gridloc = RealBox(grids[i],geom.CellSize(),geom.ProbLo()); - for (n = 0; n < BL_SPACEDIM; n++) - os << gridloc.lo(n) << ' ' << gridloc.hi(n) << '\n'; - } - // - // The full relative pathname of the MultiFabs at this level. - // The name is relative to the Header file containing this name. - // It's the name that gets written into the Header. - // - if (n_data_items > 0) - { - std::string PathNameInHeader = sLevel; - PathNameInHeader += BaseName; - os << PathNameInHeader << '\n'; - } - } - // - // We combine all of the multifabs -- state, derived, etc -- into one - // multifab -- plotMF. - // NOTE: In this tutorial code, there is no derived data - int cnt = 0; - const int nGrow = 0; - MultiFab plotMF(grids,dmap,n_data_items,nGrow,MFInfo(),Factory()); - MultiFab* this_dat = 0; - // - // Cull data from state variables -- use no ghost cells. - // - for (i = 0; i < static_cast(plot_var_map.size()); i++) - { - int typ = plot_var_map[i].first; - int comp = plot_var_map[i].second; - this_dat = &state[typ].newData(); - MultiFab::Copy(plotMF,*this_dat,comp,cnt,1,nGrow); - cnt++; - } - - // - // Use the Full pathname when naming the MultiFab. 
- // - std::string TheFullPath = FullPath; - TheFullPath += BaseName; - VisMF::Write(plotMF,TheFullPath,how,true); -} - - -void -AmrLevel::restart (Amr& papa, - std::istream& is, - bool bReadSpecial) -{ - BL_PROFILE("AmrLevel::restart()"); - parent = &papa; - - is >> level; - is >> geom; - - fine_ratio = IntVect::TheUnitVector(); fine_ratio.scale(-1); - crse_ratio = IntVect::TheUnitVector(); crse_ratio.scale(-1); - - if (level > 0) - { - crse_ratio = parent->refRatio(level-1); - } - if (level < parent->maxLevel()) - { - fine_ratio = parent->refRatio(level); - } - - if (bReadSpecial) - { - amrex::readBoxArray(grids, is, bReadSpecial); - } - else - { - grids.readFrom(is); - } - - int nstate; - is >> nstate; - int ndesc = desc_lst.size(); - - Vector state_in_checkpoint(ndesc, 1); - if (ndesc > nstate) { - set_state_in_checkpoint(state_in_checkpoint); - } else { - BL_ASSERT(nstate == ndesc); - } - - dmap.define(grids); - - parent->SetBoxArray(level, grids); - parent->SetDistributionMap(level, dmap); - -#ifdef AMREX_USE_EB - m_factory.reset(new EBFArrayBoxFactory(geom, grids, dmap, - {m_eb_basic_grow_cells, m_eb_volume_grow_cells, m_eb_full_grow_cells}, - m_eb_support_level)); -#else - m_factory.reset(new FArrayBoxFactory()); -#endif - - state.resize(ndesc); - for (int i = 0; i < ndesc; ++i) - { - if (state_in_checkpoint[i]) { - state[i].restart(is, geom.Domain(), grids, dmap, *m_factory, - desc_lst[i], papa.theRestartFile()); - } - } - - if (parent->useFixedCoarseGrids()) constructAreaNotToTag(); - - post_step_regrid = 0; - - finishConstructor(); -} - -void -AmrLevel::set_state_in_checkpoint (Vector& state_in_checkpoint) -{ - amrex::Error("Class derived AmrLevel has to handle this!"); -} - -void -AmrLevel::finishConstructor () {} - -void -AmrLevel::setTimeLevel (Real time, - Real dt_old, - Real dt_new) -{ - for (int k = 0; k < desc_lst.size(); k++) - { - state[k].setTimeLevel(time,dt_old,dt_new); - } -} - -bool -AmrLevel::isStateVariable (const std::string& name, - int& typ, - int& n) -{ - for (typ = 0; typ < desc_lst.size(); typ++) - { - const StateDescriptor& desc = desc_lst[typ]; - - for (n = 0; n < desc.nComp(); n++) - { - if (desc.name(n) == name) - return true; - } - } - return false; -} - -long -AmrLevel::countCells () const -{ - const int N = grids.size(); - - long cnt = 0; - -#ifdef _OPENMP -#pragma omp parallel for reduction(+:cnt) -#endif - for (int i = 0; i < N; i++) - { - cnt += grids[i].numPts(); - } - - return cnt; -} - -void -AmrLevel::checkPoint (const std::string& dir, - std::ostream& os, - VisMF::How how, - bool dump_old) -{ - BL_PROFILE("AmrLevel::checkPoint()"); - int ndesc = desc_lst.size(), i; - // - // Build directory to hold the MultiFabs in the StateData at this level. - // The directory is relative the the directory containing the Header file. - // - std::string LevelDir, FullPath; - LevelDirectoryNames(dir, LevelDir, FullPath); - if( ! levelDirectoryCreated) { - CreateLevelDirectory(dir); - // ---- Force other processors to wait until directory is built. - ParallelDescriptor::Barrier("AmrLevel::checkPoint::dir"); - } - - if (ParallelDescriptor::IOProcessor()) - { - os << level << '\n' << geom << '\n'; - grids.writeOn(os); - os << ndesc << '\n'; - } - // - // Output state data. - // - - for (i = 0; i < ndesc; i++) - { - // - // Now build the full relative pathname of the StateData. - // The name is relative to the Header file containing this name. - // It's the name that gets written into the Header. 
- // - std::string PathNameInHdr = amrex::Concatenate(LevelDir + "/SD_", i, 1); - std::string FullPathName = amrex::Concatenate(FullPath + "/SD_", i, 1); - - state[i].checkPoint(PathNameInHdr, FullPathName, os, how, dump_old); - } - - levelDirectoryCreated = false; // ---- now that the checkpoint is finished -} - -AmrLevel::~AmrLevel () -{ - parent = 0; -} - -void -AmrLevel::allocOldData () -{ - for (int i = 0; i < desc_lst.size(); i++) - { - state[i].allocOldData(); - } -} - -void -AmrLevel::removeOldData () -{ - for (int i = 0; i < desc_lst.size(); i++) - { - state[i].removeOldData(); - } -} - -void -AmrLevel::reset () -{ - for (int i = 0; i < desc_lst.size(); i++) - { - state[i].reset(); - } -} - -MultiFab& -AmrLevel::get_data (int state_indx, - Real time) -{ - const Real old_time = state[state_indx].prevTime(); - const Real new_time = state[state_indx].curTime(); - const Real eps = 0.001*(new_time - old_time); - - if (time > old_time-eps && time < old_time+eps) - { - return get_old_data(state_indx); - } - else if (time > new_time-eps && time < new_time+eps) - { - return get_new_data(state_indx); - } - - amrex::Error("get_data: invalid time"); - static MultiFab bogus; - return bogus; -} - -const BoxArray& -AmrLevel::getEdgeBoxArray (int dir) const -{ - BL_ASSERT(dir >=0 && dir < BL_SPACEDIM); - if (edge_grids[dir].empty()) { - edge_grids[dir] = grids; - edge_grids[dir].surroundingNodes(dir); - } - return edge_grids[dir]; -} - -const BoxArray& -AmrLevel::getNodalBoxArray () const -{ - if (nodal_grids.empty()) { - nodal_grids = grids; - nodal_grids.surroundingNodes(); - } - return nodal_grids; -} - -void -AmrLevel::setPhysBoundaryValues (FArrayBox& dest, - int state_indx, - Real time, - int dest_comp, - int src_comp, - int num_comp) -{ - state[state_indx].FillBoundary(dest,time,geom.CellSize(), - geom.ProbDomain(),dest_comp,src_comp,num_comp); -} - -FillPatchIteratorHelper::FillPatchIteratorHelper (AmrLevel& amrlevel, - MultiFab& leveldata) - : - m_amrlevel(amrlevel), - m_leveldata(leveldata), - m_mfid(m_amrlevel.level+1) -{} - -FillPatchIterator::FillPatchIterator (AmrLevel& amrlevel, - MultiFab& leveldata) - : - MFIter(leveldata), - m_amrlevel(amrlevel), - m_leveldata(leveldata), - m_ncomp(0) -{} - -FillPatchIteratorHelper::FillPatchIteratorHelper (AmrLevel& amrlevel, - MultiFab& leveldata, - int boxGrow, - Real time, - int index, - int scomp, - int ncomp, - Interpolater* mapper) - : - m_amrlevel(amrlevel), - m_leveldata(leveldata), - m_mfid(m_amrlevel.level+1), - m_time(time), - m_growsize(boxGrow), - m_index(index), - m_scomp(scomp), - m_ncomp(ncomp) -{ - Initialize(boxGrow,time,index,scomp,ncomp,mapper); -} - -FillPatchIterator::FillPatchIterator (AmrLevel& amrlevel, - MultiFab& leveldata, - int boxGrow, - Real time, - int idx, - int scomp, - int ncomp) - : - MFIter(leveldata), - m_amrlevel(amrlevel), - m_leveldata(leveldata), - m_ncomp(ncomp) -{ - BL_ASSERT(scomp >= 0); - BL_ASSERT(ncomp >= 1); - BL_ASSERT(AmrLevel::desc_lst[idx].inRange(scomp,ncomp)); - BL_ASSERT(0 <= idx && idx < AmrLevel::desc_lst.size()); - - Initialize(boxGrow,time,idx,scomp,ncomp); - -#ifdef BL_USE_TEAM - ParallelDescriptor::MyTeam().MemoryBarrier(); -#endif -} - -static -bool -NeedToTouchUpPhysCorners (const Geometry& geom) -{ - return geom.isAnyPeriodic() && !geom.isAllPeriodic(); -} - -void -FillPatchIteratorHelper::Initialize (int boxGrow, - Real time, - int idx, - int scomp, - int ncomp, - Interpolater* mapper) -{ - BL_PROFILE("FillPatchIteratorHelper::Initialize()"); - - BL_ASSERT(mapper); - 
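
The time matching in get_data above uses a tolerance of one one-thousandth of the current step. A small self-contained illustration of that test with concrete numbers (the values are made up):

    // Sketch of the tolerance test used by get_data (illustrative values).
    #include <cassert>

    int main ()
    {
        double old_time = 1.0, new_time = 1.1;
        double eps = 0.001*(new_time - old_time);    // 1.0e-4
        double time = 1.09995;                       // within eps of new_time
        assert(!(time > old_time-eps && time < old_time+eps));
        assert(  time > new_time-eps && time < new_time+eps );
        return 0;
    }
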
-    BL_ASSERT(scomp >= 0);
-    BL_ASSERT(ncomp >= 1);
-    BL_ASSERT(AmrLevel::desc_lst[idx].inRange(scomp,ncomp));
-    BL_ASSERT(0 <= idx && idx < AmrLevel::desc_lst.size());
-
-    m_map = mapper;
-    m_time = time;
-    m_growsize = boxGrow;
-    m_index = idx;
-    m_scomp = scomp;
-    m_ncomp = ncomp;
-    m_FixUpCorners = NeedToTouchUpPhysCorners(m_amrlevel.geom);
-
-    const int MyProc = ParallelDescriptor::MyProc();
-    auto& amrLevels = m_amrlevel.parent->getAmrLevels();
-    const AmrLevel& topLevel = *amrLevels[m_amrlevel.level];
-    const Box& topPDomain = topLevel.state[m_index].getDomain();
-    const IndexType& boxType = m_leveldata.boxArray().ixType();
-    const bool extrap = AmrLevel::desc_lst[m_index].extrap();
-    //
-    // Check that the interpolaters are identical.
-    //
-    BL_ASSERT(AmrLevel::desc_lst[m_index].identicalInterps(scomp,ncomp));
-
-    for (int l = 0; l <= m_amrlevel.level; ++l)
-    {
-        amrLevels[l]->state[m_index].RegisterData(m_mfcd, m_mfid[l]);
-    }
-    for (int i = 0, N = m_leveldata.boxArray().size(); i < N; ++i)
-    {
-        //
-        // A couple typedefs we'll use in the next code segment.
-        //
-        typedef std::map<int,Vector<Vector<Box> > >::value_type IntAABoxMapValType;
-
-        typedef std::map<int,Vector<Vector<Vector<FillBoxId> > > >::value_type IntAAAFBIDMapValType;
-
-        if (m_leveldata.DistributionMap()[i] != MyProc) continue;
-        //
-        // Insert with a hint since the indices are ordered lowest to highest.
-        //
-        IntAAAFBIDMapValType v1(i,Vector<Vector<Vector<FillBoxId> > >());
-
-        m_fbid.insert(m_fbid.end(),v1)->second.resize(m_amrlevel.level+1);
-
-        IntAABoxMapValType v2(i,Vector<Vector<Box> >());
-
-        m_fbox.insert(m_fbox.end(),v2)->second.resize(m_amrlevel.level+1);
-        m_cbox.insert(m_cbox.end(),v2)->second.resize(m_amrlevel.level+1);
-
-        m_ba.insert(m_ba.end(),std::map<int,Box>::value_type(i,amrex::grow(m_leveldata.boxArray()[i],m_growsize)));
-    }
-
-    BoxList tempUnfillable(boxType);
-    BoxList unfillableThisLevel(boxType);
-    Vector<Box> unfilledThisLevel;
-    Vector<Box> crse_boxes;
-    Vector<IntVect> pshifts(27);
-
-    for (std::map<int,Box>::const_iterator it = m_ba.begin(), End = m_ba.end();
-         it != End;
-         ++it)
-    {
-        const int bxidx = it->first;
-        const Box& box = it->second;
-
-        unfilledThisLevel.clear();
-        unfilledThisLevel.push_back(box);
-
-        if (!topPDomain.contains(box))
-        {
-            unfilledThisLevel.back() &= topPDomain;
-
-            if (topLevel.geom.isAnyPeriodic())
-            {
-                //
-                // May need to add additional unique pieces of valid region
-                // in order to do periodic copies into ghost cells.
-                //
-                topLevel.geom.periodicShift(topPDomain,box,pshifts);
-
-                for (const auto& iv : pshifts)
-                {
-                    Box shbox = box + iv;
-                    shbox &= topPDomain;
-
-                    if (boxType.nodeCentered())
-                    {
-                        for (int dir = 0; dir < BL_SPACEDIM; dir++)
-                        {
-                            if (iv[dir] > 0)
-                            {
-                                shbox.growHi(dir,-1);
-                            }
-                            else if (iv[dir] < 0)
-                            {
-                                shbox.growLo(dir,-1);
-                            }
-                        }
-                    }
-
-                    if (shbox.ok())
-                    {
-                        BoxList bl = amrex::boxDiff(shbox,box);
-
-                        unfilledThisLevel.insert(unfilledThisLevel.end(), bl.begin(), bl.end());
-                    }
-                }
-            }
-        }
-
-        // cells outside physical boundaries are not included in unfilledThisLevel
-
-        bool Done = false;
-
-        Vector< Vector<Box> >& TheCrseBoxes = m_cbox[bxidx];
-        Vector< Vector<Box> >& TheFineBoxes = m_fbox[bxidx];
-        Vector< Vector< Vector<FillBoxId> > >& TheFBIDs = m_fbid[bxidx];
-
-        for (int l = m_amrlevel.level; l >= 0 && !Done; --l)
-        {
-            unfillableThisLevel.clear();
-
-            AmrLevel& theAmrLevel = *amrLevels[l];
-            StateData& theState = theAmrLevel.state[m_index];
-            const Box& thePDomain = theState.getDomain();
-            const Geometry& theGeom = theAmrLevel.geom;
-            const bool is_periodic = theGeom.isAnyPeriodic();
-            const IntVect& fine_ratio = theAmrLevel.fine_ratio;
-            Vector<Box>& FineBoxes = TheFineBoxes[l];
-            //
-            // These are the boxes on this level contained in thePDomain
-            // that need to be filled in order to directly fill at the
-            // highest level or to interpolate up to the next higher level.
-            //
-            FineBoxes = unfilledThisLevel;
-            //
-            // Now build coarse boxes needed to interpolate to fine.
-            //
-            // If we're periodic and we're not at the finest level, we may
-            // need to get some additional data at this level in order to
-            // properly fill the CoarseBox()d versions of the fineboxes.
-            //
-            crse_boxes.clear();
-
-            for (const auto& fbx : FineBoxes)
-            {
-                crse_boxes.push_back(fbx);
-
-                if (l != m_amrlevel.level)
-                {
-                    const Box& cbox = m_map->CoarseBox(fbx,fine_ratio);
-
-                    crse_boxes.back() = cbox;
-
-                    if (is_periodic && !thePDomain.contains(cbox))
-                    {
-                        theGeom.periodicShift(thePDomain,cbox,pshifts);
-
-                        for (const auto& iv : pshifts)
-                        {
-                            Box shbox = cbox + iv;
-                            shbox &= thePDomain;
-
-                            if (boxType.nodeCentered())
-                            {
-                                for (int dir = 0; dir < BL_SPACEDIM; dir++)
-                                {
-                                    if (iv[dir] > 0)
-                                    {
-                                        shbox.growHi(dir,-1);
-                                    }
-                                    else if (iv[dir] < 0)
-                                    {
-                                        shbox.growLo(dir,-1);
-                                    }
-                                }
-                            }
-
-                            if (shbox.ok())
-                            {
-                                crse_boxes.push_back(shbox);
-                            }
-                        }
-                    }
-                }
-            }
-
-            Vector< Vector<FillBoxId> >& FBIDs = TheFBIDs[l];
-            Vector<Box>& CrseBoxes = TheCrseBoxes[l];
-
-            FBIDs.resize(crse_boxes.size());
-            CrseBoxes.resize(crse_boxes.size());
-            //
-            // Now attempt to get as much coarse data as possible.
- // - for (int i = 0, M = CrseBoxes.size(); i < M; i++) - { - BL_ASSERT(tempUnfillable.isEmpty()); - - CrseBoxes[i] = crse_boxes[i]; - - BL_ASSERT(CrseBoxes[i].intersects(thePDomain)); - - theState.InterpAddBox(m_mfcd, - m_mfid[l], - &tempUnfillable, - FBIDs[i], - CrseBoxes[i], - m_time, - m_scomp, - 0, - m_ncomp, - extrap); - - unfillableThisLevel.catenate(tempUnfillable); - } - - unfillableThisLevel.intersect(thePDomain); - - if (unfillableThisLevel.isEmpty()) - { - Done = true; - } - else - { - unfilledThisLevel.clear(); - - unfilledThisLevel.insert(unfilledThisLevel.end(), - unfillableThisLevel.begin(), - unfillableThisLevel.end()); - } - } - } - - m_mfcd.CollectData(); -} - -void -FillPatchIterator::Initialize (int boxGrow, - Real time, - int idx, - int scomp, - int ncomp) -{ - BL_PROFILE("FillPatchIterator::Initialize"); - - BL_ASSERT(scomp >= 0); - BL_ASSERT(ncomp >= 1); - BL_ASSERT(0 <= idx && idx < AmrLevel::desc_lst.size()); - - const StateDescriptor& desc = AmrLevel::desc_lst[idx]; - - m_ncomp = ncomp; - m_range = desc.sameInterps(scomp,ncomp); - - m_fabs.define(m_leveldata.boxArray(),m_leveldata.DistributionMap(), - m_ncomp,boxGrow,MFInfo(),m_leveldata.Factory()); - - const IndexType& boxType = m_leveldata.boxArray().ixType(); - const int level = m_amrlevel.level; - - for (int i = 0, DComp = 0; i < static_cast(m_range.size()); i++) - { - const int SComp = m_range[i].first; - const int NComp = m_range[i].second; - - if (level == 0) - { - FillFromLevel0(time, idx, SComp, DComp, NComp); - } - else - { - if (level == 1 || - amrex::ProperlyNested(m_amrlevel.crse_ratio, - m_amrlevel.parent->blockingFactor(m_amrlevel.level), - boxGrow, boxType, desc.interp(SComp))) - { - FillFromTwoLevels(time, idx, SComp, DComp, NComp); - } else { - -#ifdef AMREX_USE_EB - amrex::Abort("Grids must be properly nested for EB"); -#endif - - static bool first = true; - if (first) { - first = false; - if (ParallelDescriptor::IOProcessor()) { - IntVect new_blocking_factor = m_amrlevel.parent->blockingFactor(m_amrlevel.level); - new_blocking_factor *= 2; - for (int j = 0; j < 10; ++j) { - if (amrex::ProperlyNested(m_amrlevel.crse_ratio, - new_blocking_factor, - boxGrow, boxType, desc.interp(SComp))) { - break; - } else { - new_blocking_factor *= 2; - } - } - std::cout << "WARNING: Grids are not properly nested. We might have to use\n" - << " two coarse levels to do fillpatch. Consider using\n"; - if (new_blocking_factor < IntVect{AMREX_D_DECL(128,128,128)}) { - std::cout << " amr.blocking_factor=" << new_blocking_factor; - } else { - std::cout << " larger amr.blocking_factor. "; - } - std::cout << std::endl; - } - } - - FillPatchIteratorHelper* fph = 0; - fph = new FillPatchIteratorHelper(m_amrlevel, - m_leveldata, - boxGrow, - time, - idx, - SComp, - NComp, - desc.interp(SComp)); - -#if defined(AMREX_CRSEGRNDOMP) || (!defined(AMREX_XSDK) && defined(CRSEGRNDOMP)) -#ifdef _OPENMP -#pragma omp parallel -#endif -#endif - for (MFIter mfi(m_fabs); mfi.isValid(); ++mfi) - { - fph->fill(m_fabs[mfi],DComp,mfi.index()); - } - - delete fph; - } - } - - DComp += NComp; - } - // - // Call hack to touch up fillPatched data. 
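
The warning branch above looks for a workable blocking factor by repeated doubling, up to ten times, and prints the first value that would make the grids properly nested. The same search in isolation, with the nesting test abstracted into a hypothetical predicate supplied by the caller:

    // Sketch of the doubling search above; 'nests' stands in for the
    // amrex::ProperlyNested call made in the real code.
    #include <functional>

    int suggestBlockingFactor (int bf, const std::function<bool(int)>& nests)
    {
        bf *= 2;
        for (int j = 0; j < 10 && !nests(bf); ++j) {
            bf *= 2;   // keep doubling until the nesting test passes
        }
        return bf;
    }
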
-    //
-    m_amrlevel.set_preferred_boundary_values(m_fabs,
-                                             idx,
-                                             scomp,
-                                             0,
-                                             ncomp,
-                                             time);
-}
-
-void
-FillPatchIterator::FillFromLevel0 (Real time, int idx, int scomp, int dcomp, int ncomp)
-{
-    BL_ASSERT(m_amrlevel.level == 0);
-
-    StateData& statedata = m_amrlevel.state[idx];
-
-    Vector<MultiFab*> smf;
-    Vector<Real> stime;
-    statedata.getData(smf,stime,time);
-
-    const Geometry& geom = m_amrlevel.geom;
-
-    StateDataPhysBCFunct physbcf(statedata,scomp,geom);
-
-    amrex::FillPatchSingleLevel (m_fabs, time, smf, stime, scomp, dcomp, ncomp, geom, physbcf);
-}
-
-void
-FillPatchIterator::FillFromTwoLevels (Real time, int idx, int scomp, int dcomp, int ncomp)
-{
-    int ilev_fine = m_amrlevel.level;
-    int ilev_crse = ilev_fine-1;
-
-    BL_ASSERT(ilev_crse >= 0);
-
-    AmrLevel& fine_level = m_amrlevel;
-    AmrLevel& crse_level = m_amrlevel.parent->getLevel(ilev_crse);
-
-    const Geometry& geom_fine = fine_level.geom;
-    const Geometry& geom_crse = crse_level.geom;
-
-    Vector<MultiFab*> smf_crse;
-    Vector<Real> stime_crse;
-    StateData& statedata_crse = crse_level.state[idx];
-    statedata_crse.getData(smf_crse,stime_crse,time);
-    StateDataPhysBCFunct physbcf_crse(statedata_crse,scomp,geom_crse);
-
-    Vector<MultiFab*> smf_fine;
-    Vector<Real> stime_fine;
-    StateData& statedata_fine = fine_level.state[idx];
-    statedata_fine.getData(smf_fine,stime_fine,time);
-    StateDataPhysBCFunct physbcf_fine(statedata_fine,scomp,geom_fine);
-
-    const StateDescriptor& desc = AmrLevel::desc_lst[idx];
-
-    amrex::FillPatchTwoLevels(m_fabs, time,
-                              smf_crse, stime_crse,
-                              smf_fine, stime_fine,
-                              scomp, dcomp, ncomp,
-                              geom_crse, geom_fine,
-                              physbcf_crse, physbcf_fine,
-                              crse_level.fineRatio(),
-                              desc.interp(scomp), desc.getBCs());
-}
-
-static
-bool
-HasPhysBndry (const Box& b,
-              const Box& dmn,
-              const Geometry& geom)
-{
-    for (int i = 0; i < BL_SPACEDIM; i++)
-    {
-        if (!geom.isPeriodic(i))
-        {
-            if (b.smallEnd(i) < dmn.smallEnd(i) || b.bigEnd(i) > dmn.bigEnd(i))
-            {
-                return true;
-            }
-        }
-    }
-
-    return false;
-}
-
-static
-void
-FixUpPhysCorners (FArrayBox& fab,
-                  AmrLevel& TheLevel,
-                  int state_indx,
-                  Real time,
-                  int scomp,
-                  int dcomp,
-                  int ncomp)
-{
-    StateData& TheState = TheLevel.get_state_data(state_indx);
-    const Geometry& TheGeom = TheLevel.Geom();
-    const Box& ProbDomain = TheState.getDomain();
-
-    if (!HasPhysBndry(fab.box(),ProbDomain,TheGeom)) return;
-
-    FArrayBox tmp;
-
-    Box GrownDomain = ProbDomain;
-
-    for (int dir = 0; dir < BL_SPACEDIM; dir++)
-    {
-        if (!TheGeom.isPeriodic(dir))
-        {
-            const int lo = ProbDomain.smallEnd(dir) - fab.box().smallEnd(dir);
-            const int hi = fab.box().bigEnd(dir) - ProbDomain.bigEnd(dir);
-            if (lo > 0) GrownDomain.growLo(dir,lo);
-            if (hi > 0) GrownDomain.growHi(dir,hi);
-        }
-    }
-
-    for (int dir = 0; dir < BL_SPACEDIM; dir++)
-    {
-        if (!TheGeom.isPeriodic(dir)) continue;
-
-        Box lo_slab = fab.box();
-        Box hi_slab = fab.box();
-        lo_slab.shift(dir, ProbDomain.length(dir));
-        hi_slab.shift(dir,-ProbDomain.length(dir));
-        lo_slab &= GrownDomain;
-        hi_slab &= GrownDomain;
-
-        if (lo_slab.ok())
-        {
-            lo_slab.shift(dir,-ProbDomain.length(dir));
-
-            BL_ASSERT(fab.box().contains(lo_slab));
-            BL_ASSERT(HasPhysBndry(lo_slab,ProbDomain,TheGeom));
-
-            tmp.resize(lo_slab,ncomp);
-            tmp.copy(fab,dcomp,0,ncomp);
-            tmp.shift(dir,ProbDomain.length(dir));
-            TheLevel.setPhysBoundaryValues(tmp,
-                                           state_indx,
-                                           time,
-                                           0,
-                                           scomp,
-                                           ncomp);
-            tmp.shift(dir,-ProbDomain.length(dir));
-            fab.copy(tmp,0,dcomp,ncomp);
-        }
-
-        if (hi_slab.ok())
-        {
-            hi_slab.shift(dir,ProbDomain.length(dir));
-
-            BL_ASSERT(fab.box().contains(hi_slab));
-
BL_ASSERT(HasPhysBndry(hi_slab,ProbDomain,TheGeom)); - - tmp.resize(hi_slab,ncomp); - tmp.copy(fab,dcomp,0,ncomp); - tmp.shift(dir,-ProbDomain.length(dir)); - TheLevel.setPhysBoundaryValues(tmp, - state_indx, - time, - 0, - scomp, - ncomp); - tmp.shift(dir,ProbDomain.length(dir)); - fab.copy(tmp,0,dcomp,ncomp); - } - } -} - -void -FillPatchIteratorHelper::fill (FArrayBox& fab, - int dcomp, - int idx) -{ - BL_PROFILE("FillPatchIteratorHelper::fill()"); - - BL_ASSERT(fab.box() == m_ba[idx]); - BL_ASSERT(fab.nComp() >= dcomp + m_ncomp); - - Vector< Vector > > cfab(m_amrlevel.level+1); - Vector< Vector >& TheCrseBoxes = m_cbox[idx]; - Vector< Vector >& TheFineBoxes = m_fbox[idx]; - Vector< Vector< Vector > >& TheFBIDs = m_fbid[idx]; - const bool extrap = AmrLevel::desc_lst[m_index].extrap(); - auto& amrLevels = m_amrlevel.parent->getAmrLevels(); - // - // Build all coarse fabs from which we'll interpolate and - // fill them with coarse data as best we can. - // - for (int l = 0; l <= m_amrlevel.level; l++) - { - StateData& TheState = amrLevels[l]->state[m_index]; - const Vector& CrseBoxes = TheCrseBoxes[l]; - auto& CrseFabs = cfab[l]; - const Vector< Vector >& FBIDs = TheFBIDs[l]; - const int NC = CrseBoxes.size(); - - CrseFabs.resize(NC); - - for (int i = 0; i < NC; i++) - { - BL_ASSERT(CrseBoxes[i].ok()); - CrseFabs[i].reset(new FArrayBox(CrseBoxes[i],m_ncomp)); - } - - for (int i = 0; i < NC; i++) - { - // - // Set to special value we'll later check - // to ensure we've filled the FABs at the coarse level. - // - TheState.InterpFillFab(m_mfcd, - m_mfid[l], - FBIDs[i], - *CrseFabs[i], - m_time, - 0, - 0, - m_ncomp, - extrap); - } - } - // - // Now work from the bottom up interpolating to next higher level. - // - for (int l = 0; l < m_amrlevel.level; l++) - { - auto& CrseFabs = cfab[l]; - AmrLevel& TheLevel = *amrLevels[l]; - StateData& TheState = TheLevel.state[m_index]; - const Box& ThePDomain = TheState.getDomain(); - const int NC = CrseFabs.size(); - - if (TheLevel.geom.isAnyPeriodic()) - { - // - // Fill CrseFabs with periodic data in preparation for interp(). - // - for (int i = 0; i < NC; i++) - { - FArrayBox& dstfab = *CrseFabs[i]; - - if (ThePDomain.contains(dstfab.box())) continue; - - Vector pshifts(27); - - TheLevel.geom.periodicShift(ThePDomain,dstfab.box(),pshifts); - - for (const auto& iv : pshifts) - { - Box fullsrcbox = dstfab.box() + iv; - fullsrcbox &= ThePDomain; - - for (int j = 0; j < NC; j++) - { - const FArrayBox& srcfab = *CrseFabs[j]; - const Box& srcbox = fullsrcbox & srcfab.box(); - - if (srcbox.ok()) - { - const Box& dstbox = srcbox - iv; - - dstfab.copy(srcfab,srcbox,0,dstbox,0,m_ncomp); - } - } - } - } - } - // - // Set non-periodic BCs in coarse data -- what we interpolate with. - // This MUST come after the periodic fill mumbo-jumbo. - for (int i = 0; i < NC; ++i) - { - if ( ! ThePDomain.contains(CrseFabs[i]->box())) - { - TheLevel.setPhysBoundaryValues(*CrseFabs[i], - m_index, - m_time, - 0, - m_scomp, - m_ncomp); - } - } - - if (m_FixUpCorners) - { - for (int i = 0; i < NC; ++i) - { - FixUpPhysCorners(*CrseFabs[i],TheLevel,m_index,m_time,m_scomp,0,m_ncomp); - } - } - // - // Interpolate up to next level. 
- // - AmrLevel& crseAmrLevel = *amrLevels[l]; - AmrLevel& fineAmrLevel = *amrLevels[l+1]; - const IntVect& fine_ratio = crseAmrLevel.fine_ratio; - const Vector& FineBoxes = TheFineBoxes[l]; - StateData& fState = fineAmrLevel.state[m_index]; - const Box& fDomain = fState.getDomain(); - auto& FinerCrseFabs = cfab[l+1]; - const Vector& theBCs = AmrLevel::desc_lst[m_index].getBCs(); - const int NF = FineBoxes.size(); - - for (int ifine = 0; ifine < NF; ++ifine) - { - Vector bcr(m_ncomp); - FArrayBox finefab(FineBoxes[ifine],m_ncomp); - FArrayBox crsefab(m_map->CoarseBox(finefab.box(),fine_ratio),m_ncomp); - // - // Fill crsefab from m_cbox via copy on intersect. - // - for (int j = 0; j < NC; j++) { - crsefab.copy(*CrseFabs[j]); - } - // - // Get boundary conditions for the fine patch. - // - amrex::setBC(finefab.box(), - fDomain, - m_scomp, - 0, - m_ncomp, - theBCs, - bcr); - // - // Interpolate up to fine patch. - // - m_map->interp(crsefab, - 0, - finefab, - 0, - m_ncomp, - finefab.box(), - fine_ratio, - crseAmrLevel.geom, - fineAmrLevel.geom, - bcr, - m_scomp, - m_index, RunOn::Cpu); - // - // Copy intersect finefab into next level m_cboxes. - // - for (int j = 0, K = FinerCrseFabs.size(); j < K; ++j) { - FinerCrseFabs[j]->copy(finefab); - } - } - - CrseFabs.clear(); - } - // - // Now for the finest level stuff. - // - StateData& FineState = m_amrlevel.state[m_index]; - const Box& FineDomain = FineState.getDomain(); - const Geometry& FineGeom = m_amrlevel.geom; - auto& FinestCrseFabs = cfab[m_amrlevel.level]; - // - // Copy intersect coarse into destination fab. - // - for (int i = 0, N = FinestCrseFabs.size(); i < N; ++i) { - fab.copy(*FinestCrseFabs[i],0,dcomp,m_ncomp); - } - - if (FineGeom.isAnyPeriodic() && !FineDomain.contains(fab.box())) - { - Vector pshifts(27); - - FineGeom.periodicShift(FineDomain,fab.box(),pshifts); - - for (int i = 0, N = FinestCrseFabs.size(); i < N; i++) - { - for (const auto& iv : pshifts) - { - fab.shift(iv); - - Box src_dst = FinestCrseFabs[i]->box() & fab.box(); - src_dst &= FineDomain; - - if (src_dst.ok()) - fab.copy(*FinestCrseFabs[i],src_dst,0,src_dst,dcomp,m_ncomp); - - fab.shift(-iv); - } - } - } - // - // No longer need coarse data at finest level. - // - FinestCrseFabs.clear(); - // - // Final set of non-periodic BCs. - // - if (! FineState.getDomain().contains(fab.box())) - { - m_amrlevel.setPhysBoundaryValues(fab, - m_index, - m_time, - dcomp, - m_scomp, - m_ncomp); - } - - if (m_FixUpCorners) - { - FixUpPhysCorners(fab,m_amrlevel,m_index,m_time,m_scomp,dcomp,m_ncomp); - } -} - -FillPatchIteratorHelper::~FillPatchIteratorHelper () {} - -FillPatchIterator::~FillPatchIterator () {} - -void -AmrLevel::FillCoarsePatch (MultiFab& mf, - int dcomp, - Real time, - int idx, - int scomp, - int ncomp, - int nghost) -{ - BL_PROFILE("AmrLevel::FillCoarsePatch()"); - - // - // Must fill this region on crse level and interpolate. 
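
FillCoarsePatch is what a freshly created fine level typically calls when it has no data of its own yet, e.g. from a derived level's init(). A hedged sketch of such a caller; MyLevel and State_Type are hypothetical application-side names, and the required time-level bookkeeping (setTimeLevel and friends) is omitted:

    // Hypothetical caller: a new fine level fills its state entirely by
    // interpolation from the next coarser level.
    void
    MyLevel::init ()
    {
        Real time = parent->cumTime();
        MultiFab& S_new = get_new_data(State_Type);
        FillCoarsePatch(S_new, 0, time, State_Type, 0, S_new.nComp());
    }
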
-    //
-    BL_ASSERT(level != 0);
-    BL_ASSERT(ncomp <= (mf.nComp()-dcomp));
-    BL_ASSERT(nghost <= mf.nGrow());
-    BL_ASSERT(0 <= idx && idx < desc_lst.size());
-
-    int DComp = dcomp;
-    const StateDescriptor& desc = desc_lst[idx];
-    const Box& pdomain = state[idx].getDomain();
-    const BoxArray& mf_BA = mf.boxArray();
-    const DistributionMapping& mf_DM = mf.DistributionMap();
-    AmrLevel& clev = parent->getLevel(level-1);
-    const Geometry& cgeom = clev.geom;
-
-    Box domain_g = pdomain;
-    for (int i = 0; i < BL_SPACEDIM; ++i) {
-        if (geom.isPeriodic(i)) {
-            domain_g.grow(i,nghost);
-        }
-    }
-
-    std::vector< std::pair<int,int> > ranges = desc.sameInterps(scomp,ncomp);
-
-    BL_ASSERT(desc.inRange(scomp, ncomp));
-
-    for (int i = 0; i < static_cast<int>(ranges.size()); i++)
-    {
-        const int SComp = ranges[i].first;
-        const int NComp = ranges[i].second;
-        Interpolater* mapper = desc.interp(SComp);
-
-        BoxArray crseBA(mf_BA.size());
-
-        for (int j = 0, N = crseBA.size(); j < N; ++j)
-        {
-            BL_ASSERT(mf_BA[j].ixType() == desc.getType());
-            const Box& bx = amrex::grow(mf_BA[j],nghost) & domain_g;
-            crseBA.set(j,mapper->CoarseBox(bx, crse_ratio));
-        }
-
-#ifdef AMREX_USE_EB
-        MultiFab crseMF(crseBA,mf_DM,NComp,0,MFInfo(),
-                        EBFArrayBoxFactory(cgeom, crseBA, mf_DM, {0,0,0}, EBSupport::basic));
-#else
-        MultiFab crseMF(crseBA,mf_DM,NComp,0);
-#endif
-
-        if ( level == 1
-             || amrex::ProperlyNested(crse_ratio, parent->blockingFactor(level),
-                                      nghost, mf_BA.ixType(), mapper) )
-        {
-            StateData& statedata = clev.state[idx];
-
-            Vector<MultiFab*> smf;
-            Vector<Real> stime;
-            statedata.getData(smf,stime,time);
-
-            StateDataPhysBCFunct physbcf(statedata,SComp,cgeom);
-
-            amrex::FillPatchSingleLevel(crseMF,time,smf,stime,SComp,0,NComp,cgeom,physbcf);
-        }
-        else
-        {
-            FillPatch(clev,crseMF,0,time,idx,SComp,NComp,0);
-        }
-
-#ifdef _OPENMP
-#pragma omp parallel
-#endif
-        for (MFIter mfi(mf); mfi.isValid(); ++mfi)
-        {
-            const Box& dbx = amrex::grow(mfi.validbox(),nghost) & domain_g;
-
-            Vector<BCRec> bcr(ncomp);
-
-            amrex::setBC(dbx,pdomain,SComp,0,NComp,desc.getBCs(),bcr);
-
-            mapper->interp(crseMF[mfi],
-                           0,
-                           mf[mfi],
-                           DComp,
-                           NComp,
-                           dbx,
-                           crse_ratio,
-                           cgeom,
-                           geom,
-                           bcr,
-                           SComp,
-                           idx, RunOn::Cpu);
-        }
-
-        StateDataPhysBCFunct physbcf(state[idx],SComp,geom);
-        physbcf.FillBoundary(mf, DComp, NComp, time);
-
-        DComp += NComp;
-    }
-}
-
-std::unique_ptr<MultiFab>
-AmrLevel::derive (const std::string& name,
-                  Real time,
-                  int ngrow)
-{
-    BL_ASSERT(ngrow >= 0);
-
-    std::unique_ptr<MultiFab> mf;
-
-    int index, scomp, ncomp;
-
-    if (isStateVariable(name, index, scomp))
-    {
-        mf.reset(new MultiFab(state[index].boxArray(), dmap, 1, ngrow, MFInfo(), *m_factory));
-        FillPatch(*this,*mf,ngrow,time,index,scomp,1);
-    }
-    else if (const DeriveRec* rec = derive_lst.get(name))
-    {
-        rec->getRange(0, index, scomp, ncomp);
-
-        const BoxArray& srcBA = state[index].boxArray();
-
-        BoxArray dstBA(srcBA);
-        dstBA.convert(rec->deriveType());
-
-        int ngrow_src = ngrow;
-        {
-            Box bx0 = srcBA[0];
-            Box bx1 = rec->boxMap()(bx0);
-            int g = bx0.smallEnd(0) - bx1.smallEnd(0);
-            ngrow_src += g;
-        }
-
-        MultiFab srcMF(srcBA, dmap, rec->numState(), ngrow_src, MFInfo(), *m_factory);
-
-        for (int k = 0, dc = 0; k < rec->numRange(); k++, dc += ncomp)
-        {
-            rec->getRange(k, index, scomp, ncomp);
-            FillPatch(*this,srcMF,ngrow_src,time,index,scomp,ncomp,dc);
-        }
-
-        mf.reset(new MultiFab(dstBA, dmap, rec->numDerive(), ngrow, MFInfo(), *m_factory));
-
-#if defined(AMREX_CRSEGRNDOMP) || (!defined(AMREX_XSDK) && defined(CRSEGRNDOMP))
-#ifdef _OPENMP
-#pragma omp parallel
-#endif
-        for (MFIter mfi(*mf,true); mfi.isValid(); ++mfi)
-        {
-            int grid_no = mfi.index();
-            Real* ddat = (*mf)[mfi].dataPtr();
-            const int* dlo = (*mf)[mfi].loVect();
-            const int* dhi = (*mf)[mfi].hiVect();
-            const Box& gtbx = mfi.growntilebox();
-            const int* lo = gtbx.loVect();
-            const int* hi = gtbx.hiVect();
-            int n_der = rec->numDerive();
-            Real* cdat = srcMF[mfi].dataPtr();
-            const int* clo = srcMF[mfi].loVect();
-            const int* chi = srcMF[mfi].hiVect();
-            int n_state = rec->numState();
-            const int* dom_lo = state[index].getDomain().loVect();
-            const int* dom_hi = state[index].getDomain().hiVect();
-            const Real* dx = geom.CellSize();
-            const int* bcr = rec->getBC();
-            const RealBox temp (gtbx,geom.CellSize(),geom.ProbLo());
-            const Real* xlo = temp.lo();
-            Real dt = parent->dtLevel(level);
-
-            if (rec->derFunc() != static_cast<DeriveFunc>(0)){
-                rec->derFunc()(ddat,ARLIM(dlo),ARLIM(dhi),&n_der,
-                               cdat,ARLIM(clo),ARLIM(chi),&n_state,
-                               lo,hi,dom_lo,dom_hi,dx,xlo,&time,&dt,bcr,
-                               &level,&grid_no);
-            } else if (rec->derFunc3D() != static_cast<DeriveFunc3D>(0)){
-                rec->derFunc3D()(ddat,ARLIM_3D(dlo),ARLIM_3D(dhi),&n_der,
-                                 cdat,ARLIM_3D(clo),ARLIM_3D(chi),&n_state,
-                                 ARLIM_3D(lo),ARLIM_3D(hi),
-                                 ARLIM_3D(dom_lo),ARLIM_3D(dom_hi),
-                                 ZFILL(dx),ZFILL(xlo),
-                                 &time,&dt,
-                                 AMREX_BCREC_3D(bcr),
-                                 &level,&grid_no);
-            } else {
-                amrex::Error("AmrLevel::derive: no function available");
-            }
-        }
-#else
-        for (MFIter mfi(srcMF); mfi.isValid(); ++mfi)
-        {
-            int grid_no = mfi.index();
-            const RealBox gridloc(grids[grid_no],geom.CellSize(),geom.ProbLo());
-            Real* ddat = (*mf)[mfi].dataPtr();
-            const int* dlo = (*mf)[mfi].loVect();
-            const int* dhi = (*mf)[mfi].hiVect();
-            int n_der = rec->numDerive();
-            Real* cdat = srcMF[mfi].dataPtr();
-            const int* clo = srcMF[mfi].loVect();
-            const int* chi = srcMF[mfi].hiVect();
-            int n_state = rec->numState();
-            const int* dom_lo = state[index].getDomain().loVect();
-            const int* dom_hi = state[index].getDomain().hiVect();
-            const Real* dx = geom.CellSize();
-            const int* bcr = rec->getBC();
-            const Real* xlo = gridloc.lo();
-            Real dt = parent->dtLevel(level);
-
-            if (rec->derFunc() != static_cast<DeriveFunc>(0)){
-                rec->derFunc()(ddat,ARLIM(dlo),ARLIM(dhi),&n_der,
-                               cdat,ARLIM(clo),ARLIM(chi),&n_state,
-                               dlo,dhi,dom_lo,dom_hi,dx,xlo,&time,&dt,bcr,
-                               &level,&grid_no);
-            } else if (rec->derFunc3D() != static_cast<DeriveFunc3D>(0)){
-                rec->derFunc3D()(ddat,ARLIM_3D(dlo),ARLIM_3D(dhi),&n_der,
-                                 cdat,ARLIM_3D(clo),ARLIM_3D(chi),&n_state,
-                                 ARLIM_3D(dlo),ARLIM_3D(dhi),
-                                 ARLIM_3D(dom_lo),ARLIM_3D(dom_hi),
-                                 ZFILL(dx),ZFILL(xlo),
-                                 &time,&dt,
-                                 AMREX_BCREC_3D(bcr),
-                                 &level,&grid_no);
-            } else {
-                amrex::Error("AmrLevel::derive: no function available");
-            }
-        }
-#endif
-    }
-    else
-    {
-        //
-        // If we got here, cannot derive given name.
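
Both dispatch branches above call a user-registered derive function; registration happens on the application side via the DeriveList. A hedged sketch of registering a one-component, cell-centered derived quantity; the routine dermagvel and the State_Type/Xvel indices are application-side assumptions, not names defined in this file:

    // Hypothetical registration: "magvel", 1 output component, computed
    // from 3 state components starting at Xvel, on the same box.
    derive_lst.add("magvel", IndexType::TheCellType(), 1,
                   dermagvel, DeriveRec::TheSameBox);
    derive_lst.addComponent("magvel", desc_lst, State_Type, Xvel, 3);
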
-        //
-        std::string msg("AmrLevel::derive(MultiFab*): unknown variable: ");
-        msg += name;
-        amrex::Error(msg.c_str());
-    }
-
-    return mf;
-}
-
-void
-AmrLevel::derive (const std::string& name,
-                  Real time,
-                  MultiFab& mf,
-                  int dcomp)
-{
-    BL_ASSERT(dcomp < mf.nComp());
-
-    const int ngrow = mf.nGrow();
-
-    int index, scomp, ncomp;
-
-    if (isStateVariable(name,index,scomp))
-    {
-        FillPatch(*this,mf,ngrow,time,index,scomp,1);
-    }
-    else if (const DeriveRec* rec = derive_lst.get(name))
-    {
-        rec->getRange(0,index,scomp,ncomp);
-
-        const BoxArray& srcBA = state[index].boxArray();
-
-        int ngrow_src = ngrow;
-        {
-            Box bx0 = srcBA[0];
-            Box bx1 = rec->boxMap()(bx0);
-            int g = bx0.smallEnd(0) - bx1.smallEnd(0);
-            ngrow_src += g;
-        }
-
-        MultiFab srcMF(srcBA,dmap,rec->numState(),ngrow_src, MFInfo(), *m_factory);
-
-        for (int k = 0, dc = 0; k < rec->numRange(); k++, dc += ncomp)
-        {
-            rec->getRange(k,index,scomp,ncomp);
-
-            FillPatch(*this,srcMF,ngrow_src,time,index,scomp,ncomp,dc);
-        }
-
-#if defined(AMREX_CRSEGRNDOMP) || (!defined(AMREX_XSDK) && defined(CRSEGRNDOMP))
-#ifdef _OPENMP
-#pragma omp parallel
-#endif
-        for (MFIter mfi(mf,true); mfi.isValid(); ++mfi)
-        {
-            int idx = mfi.index();
-            Real* ddat = mf[mfi].dataPtr(dcomp);
-            const int* dlo = mf[mfi].loVect();
-            const int* dhi = mf[mfi].hiVect();
-            const Box& gtbx = mfi.growntilebox();
-            const int* lo = gtbx.loVect();
-            const int* hi = gtbx.hiVect();
-            int n_der = rec->numDerive();
-            Real* cdat = srcMF[mfi].dataPtr();
-            const int* clo = srcMF[mfi].loVect();
-            const int* chi = srcMF[mfi].hiVect();
-            int n_state = rec->numState();
-            const int* dom_lo = state[index].getDomain().loVect();
-            const int* dom_hi = state[index].getDomain().hiVect();
-            const Real* dx = geom.CellSize();
-            const int* bcr = rec->getBC();
-            const RealBox& temp = RealBox(gtbx,geom.CellSize(),geom.ProbLo());
-            const Real* xlo = temp.lo();
-            Real dt = parent->dtLevel(level);
-
-            if (rec->derFunc() != static_cast<DeriveFunc>(0)){
-                rec->derFunc()(ddat,ARLIM(dlo),ARLIM(dhi),&n_der,
-                               cdat,ARLIM(clo),ARLIM(chi),&n_state,
-                               lo,hi,dom_lo,dom_hi,dx,xlo,&time,&dt,bcr,
-                               &level,&idx);
-            } else if (rec->derFunc3D() != static_cast<DeriveFunc3D>(0)){
-                rec->derFunc3D()(ddat,ARLIM_3D(dlo),ARLIM_3D(dhi),&n_der,
-                                 cdat,ARLIM_3D(clo),ARLIM_3D(chi),&n_state,
-                                 ARLIM_3D(lo),ARLIM_3D(hi),
-                                 ARLIM_3D(dom_lo),ARLIM_3D(dom_hi),
-                                 ZFILL(dx),ZFILL(xlo),
-                                 &time,&dt,
-                                 AMREX_BCREC_3D(bcr),
-                                 &level,&idx);
-            } else {
-                amrex::Error("AmrLevel::derive: no function available");
-            }
-        }
-#else
-        for (MFIter mfi(srcMF); mfi.isValid(); ++mfi)
-        {
-            int idx = mfi.index();
-            Real* ddat = mf[mfi].dataPtr(dcomp);
-            const int* dlo = mf[mfi].loVect();
-            const int* dhi = mf[mfi].hiVect();
-            int n_der = rec->numDerive();
-            Real* cdat = srcMF[mfi].dataPtr();
-            const int* clo = srcMF[mfi].loVect();
-            const int* chi = srcMF[mfi].hiVect();
-            int n_state = rec->numState();
-            const int* dom_lo = state[index].getDomain().loVect();
-            const int* dom_hi = state[index].getDomain().hiVect();
-            const Real* dx = geom.CellSize();
-            const int* bcr = rec->getBC();
-            const RealBox& temp = RealBox(mf[mfi].box(),geom.CellSize(),geom.ProbLo());
-            const Real* xlo = temp.lo();
-            Real dt = parent->dtLevel(level);
-
-            if (rec->derFunc() != static_cast<DeriveFunc>(0)){
-                rec->derFunc()(ddat,ARLIM(dlo),ARLIM(dhi),&n_der,
-                               cdat,ARLIM(clo),ARLIM(chi),&n_state,
-                               dlo,dhi,dom_lo,dom_hi,dx,xlo,&time,&dt,bcr,
-                               &level,&idx);
-            } else if (rec->derFunc3D() != static_cast<DeriveFunc3D>(0)){
-                rec->derFunc3D()(ddat,ARLIM_3D(dlo),ARLIM_3D(dhi),&n_der,
-                                 cdat,ARLIM_3D(clo),ARLIM_3D(chi),&n_state,
-                                 ARLIM_3D(dlo),ARLIM_3D(dhi),
-                                 ARLIM_3D(dom_lo),ARLIM_3D(dom_hi),
-                                 ZFILL(dx),ZFILL(xlo),
-                                 &time,&dt,
-                                 AMREX_BCREC_3D(bcr),
-                                 &level,&idx);
-            } else {
-                amrex::Error("AmrLevel::derive: no function available");
-            }
-        }
-#endif
-    }
-    else
-    {
-        //
-        // If we got here, cannot derive given name.
-        //
-        std::string msg("AmrLevel::derive(MultiFab*): unknown variable: ");
-        msg += name;
-        amrex::Error(msg.c_str());
-    }
-}
-
-//! Update the distribution maps in StateData based on the size of the map
-void
-AmrLevel::UpdateDistributionMaps ( DistributionMapping& update_dmap )
-{
-    long mapsize = update_dmap.size();
-
-    if (dmap.size() == mapsize)
-    { dmap = update_dmap; }
-
-    for (int i = 0; i < state.size(); ++i)
-    {
-        if (state[i].DistributionMap().size() == mapsize)
-        { state[i].setDistributionMap(update_dmap); }
-    }
-}
-
-
-
-Vector<int>
-AmrLevel::getBCArray (int State_Type,
-                      int gridno,
-                      int strt_comp,
-                      int ncomp)
-{
-    Vector<int> bc(2*BL_SPACEDIM*ncomp);
-
-    BCRec bcr;
-
-    for (int n = 0; n < ncomp; n++)
-    {
-        bcr = state[State_Type].getBC(strt_comp+n,gridno);
-        const int* b_rec = bcr.vect();
-        for (int m = 0; m < 2*BL_SPACEDIM; m++)
-            bc[2*BL_SPACEDIM*n + m] = b_rec[m];
-    }
-
-    return bc;
-}
-
-int
-AmrLevel::okToRegrid ()
-{
-    return true;
-}
-
-void
-AmrLevel::setPlotVariables ()
-{
-    ParmParse pp("amr");
-
-    if (pp.contains("plot_vars"))
-    {
-        std::string nm;
-
-        int nPltVars = pp.countval("plot_vars");
-
-        for (int i = 0; i < nPltVars; i++)
-        {
-            pp.get("plot_vars", nm, i);
-
-            if (nm == "ALL")
-                parent->fillStatePlotVarList();
-            else if (nm == "NONE")
-                parent->clearStatePlotVarList();
-            else
-                parent->addStatePlotVar(nm);
-        }
-    }
-    else
-    {
-        //
-        // The default is to add them all.
-        //
-        parent->fillStatePlotVarList();
-    }
-
-    if (pp.contains("derive_plot_vars"))
-    {
-        std::string nm;
-
-        int nDrvPltVars = pp.countval("derive_plot_vars");
-
-        for (int i = 0; i < nDrvPltVars; i++)
-        {
-            pp.get("derive_plot_vars", nm, i);
-
-            if (nm == "ALL")
-                parent->fillDerivePlotVarList();
-            else if (nm == "NONE")
-                parent->clearDerivePlotVarList();
-            else
-                parent->addDerivePlotVar(nm);
-        }
-    }
-    else
-    {
-        //
-        // The default is to add none of them.
-        //
-        parent->clearDerivePlotVarList();
-    }
-}
-
-void
-AmrLevel::setSmallPlotVariables ()
-{
-    ParmParse pp("amr");
-
-    if (pp.contains("small_plot_vars"))
-    {
-        std::string nm;
-
-        int nPltVars = pp.countval("small_plot_vars");
-
-        for (int i = 0; i < nPltVars; i++)
-        {
-            pp.get("small_plot_vars", nm, i);
-
-            parent->addStateSmallPlotVar(nm);
-        }
-    }
-    else
-    {
-        //
-        // The default is to use none.
-        //
-        parent->clearStateSmallPlotVarList();
-    }
-
-    if (pp.contains("derive_small_plot_vars"))
-    {
-        std::string nm;
-
-        int nDrvPltVars = pp.countval("derive_small_plot_vars");
-
-        for (int i = 0; i < nDrvPltVars; i++)
-        {
-            pp.get("derive_small_plot_vars", nm, i);
-
-            if (nm == "ALL")
-                parent->fillDeriveSmallPlotVarList();
-            else if (nm == "NONE")
-                parent->clearDeriveSmallPlotVarList();
-            else
-                parent->addDeriveSmallPlotVar(nm);
-        }
-    }
-    else
-    {
-        //
-        // The default is to add none of them.
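
setPlotVariables and setSmallPlotVariables above are driven purely by ParmParse; the corresponding inputs-file lines look like the following (the variable names are illustrative, not prescribed):

    amr.plot_vars              = density xmom ymom   # explicit list, or ALL / NONE
    amr.derive_plot_vars       = NONE
    amr.small_plot_vars        = density
    amr.derive_small_plot_vars = ALL
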
-        //
-        parent->clearDeriveSmallPlotVarList();
-    }
-
-}
-
-AmrLevel::TimeLevel
-AmrLevel::which_time (int indx,
-                      Real time) const
-{
-    const Real oldtime = state[indx].prevTime();
-    const Real newtime = state[indx].curTime();
-    const Real haftime = .5 * (oldtime + newtime);
-    const Real qtime = oldtime + 0.25*(newtime-oldtime);
-    const Real tqtime = oldtime + 0.75*(newtime-oldtime);
-    const Real epsilon = 0.001 * (newtime - oldtime);
-
-    BL_ASSERT(time >= oldtime-epsilon && time <= newtime+epsilon);
-
-    if (time >= oldtime-epsilon && time <= oldtime+epsilon)
-    {
-        return AmrOldTime;
-    }
-    else if (time >= newtime-epsilon && time <= newtime+epsilon)
-    {
-        return AmrNewTime;
-    }
-    else if (time >= haftime-epsilon && time <= haftime+epsilon)
-    {
-        return AmrHalfTime;
-    }
-    else if (time >= qtime-epsilon && time <= qtime+epsilon)
-    {
-        return Amr1QtrTime;
-    }
-    else if (time >= tqtime-epsilon && time <= tqtime+epsilon)
-    {
-        return Amr3QtrTime;
-    }
-    return AmrOtherTime;
-}
-
-Real
-AmrLevel::estimateWork ()
-{
-    return 1.0*countCells();
-}
-
-bool
-AmrLevel::writePlotNow ()
-{
-    return false;
-}
-
-bool
-AmrLevel::writeSmallPlotNow ()
-{
-    return false;
-}
-
-const BoxArray& AmrLevel::getAreaNotToTag()
-{
-    return m_AreaNotToTag;
-}
-
-const Box& AmrLevel::getAreaToTag()
-{
-    return m_AreaToTag;
-}
-
-void AmrLevel::setAreaNotToTag(BoxArray& ba)
-{
-    m_AreaNotToTag = ba;
-}
-
-void AmrLevel::constructAreaNotToTag()
-{
-    if (level == 0 || !parent->useFixedCoarseGrids() || parent->useFixedUpToLevel()>level)
-        return;
-
-    // We are restricting the tagging on the finest fixed level
-    if (parent->useFixedUpToLevel()==level)
-    {
-        // We use the next coarser level shrunk by one blockingfactor
-        // as the region in which we allow tagging.
-        // Why level-1? Because we always use the full domain at level 0
-        // and therefore level 0 in initialba is level 1 in the AMR hierarchy, etc.
-        const Vector<BoxArray>& initialba = parent->getInitialBA();
-        Box tagarea(initialba[level-1].minimalBox());
-        tagarea.grow(-parent->blockingFactor(level));
-        m_AreaToTag = tagarea;
-
-        // We disallow tagging in the remaining part of the domain.
-        BoxArray tagba = amrex::boxComplement(parent->Geom(level).Domain(),m_AreaToTag);
-        m_AreaNotToTag = tagba;
-
-        BoxArray bxa(parent->Geom(level).Domain());
-        BL_ASSERT(bxa.contains(m_AreaNotToTag));
-    }
-
-    if (parent->useFixedUpToLevel()<level)
-    {
-        Box tagarea = parent->getLevel(level-1).getAreaToTag();
-        tagarea.refine(parent->refRatio(level-1));
-        tagarea.grow(-parent->blockingFactor(level));
-        m_AreaToTag = tagarea;
-        BoxArray tagba = amrex::boxComplement(parent->Geom(level).Domain(),m_AreaToTag);
-        m_AreaNotToTag = tagba;
-    }
-}
-
-void
-AmrLevel::FillPatch(AmrLevel& amrlevel,
-                    MultiFab& leveldata,
-                    int boxGrow,
-                    Real time,
-                    int index,
-                    int scomp,
-                    int ncomp,
-                    int dcomp)
-{
-    BL_ASSERT(dcomp+ncomp-1 <= leveldata.nComp());
-    BL_ASSERT(boxGrow <= leveldata.nGrow());
-    FillPatchIterator fpi(amrlevel, leveldata, boxGrow, time, index, scomp, ncomp);
-    const MultiFab& mf_fillpatched = fpi.get_mf();
-    MultiFab::Copy(leveldata, mf_fillpatched, 0, dcomp, ncomp, boxGrow);
-}
-
-void
-AmrLevel::LevelDirectoryNames(const std::string &dir,
-                              std::string &LevelDir,
-                              std::string &FullPath)
-{
-    LevelDir = amrex::Concatenate("Level_", level, 1);
-    //
-    // Now for the full pathname of that directory.
-    //
-    FullPath = dir;
-    if( !
FullPath.empty() && FullPath.back() != '/') { - FullPath += '/'; - } - FullPath += LevelDir; -} - -void -AmrLevel::CreateLevelDirectory (const std::string &dir) -{ - // Build directory to hold the MultiFabs in the StateData at this level. - // The directory is relative the the directory containing the Header file. - - std::string LevelDir, FullPath; - LevelDirectoryNames(dir, LevelDir, FullPath); - - if(ParallelDescriptor::IOProcessor()) { - if( ! amrex::UtilCreateDirectory(FullPath, 0755)) { - amrex::CreateDirectoryFailed(FullPath); - } - } - - levelDirectoryCreated = true; -} - -} - diff --git a/Src/AmrTask/Amr/AMReX_AmrTask.cpp b/Src/AmrTask/Amr/AMReX_AmrTask.cpp deleted file mode 100644 index b8c94e9c7fe..00000000000 --- a/Src/AmrTask/Amr/AMReX_AmrTask.cpp +++ /dev/null @@ -1,3056 +0,0 @@ - -#include -#include -#include -#include -#include -#include -#include -#include -#include - -#ifdef _OPENMP -#include -#endif - -#include -#include -#include - -#include -#include -#include -#include -#include -#include -#include -#include -#include -#include -#include -#include -#include -#include -#include -#include -#include -#include - -#ifdef BL_LAZY -#include -#endif - -#ifdef AMREX_MEM_PROFILING -#include -#endif - -#ifdef BL_USE_ARRAYVIEW -#include -#endif - -namespace amrex { - -// -// Static class members. Set defaults in Initialize()!!! -// -std::list Amr::state_plot_vars; -std::list Amr::state_small_plot_vars; -std::list Amr::derive_plot_vars; -std::list Amr::derive_small_plot_vars; -bool Amr::first_plotfile; -bool Amr::first_smallplotfile; -Vector Amr::initial_ba; -Vector Amr::regrid_ba; - -namespace -{ - const std::string CheckPointVersion("CheckPointVersion_1.0"); - - bool initialized = false; -} - -namespace -{ - // - // These are all ParmParse'd in. Set defaults in Initialize()!!! - // - int plot_nfiles; - int mffile_nstreams; - int probinit_natonce; - bool plot_files_output; - int checkpoint_nfiles; - int regrid_on_restart; - int use_efficient_regrid; - int plotfile_on_restart; - int checkpoint_on_restart; - bool checkpoint_files_output; - int compute_new_dt_on_regrid; - bool precreateDirectories; - bool prereadFAHeaders; - VisMF::Header::Version plot_headerversion(VisMF::Header::Version_v1); - VisMF::Header::Version checkpoint_headerversion(VisMF::Header::Version_v1); - -} - -void -Amr::Initialize () -{ - if (initialized) return; - // - // Set all defaults here!!! 
- // - Amr::first_plotfile = true; - Amr::first_smallplotfile = true; - plot_nfiles = 64; - mffile_nstreams = 1; - probinit_natonce = 32; - plot_files_output = true; - checkpoint_nfiles = 64; - regrid_on_restart = 0; - use_efficient_regrid = 0; - plotfile_on_restart = 0; - checkpoint_on_restart = 0; - checkpoint_files_output = true; - compute_new_dt_on_regrid = 0; - precreateDirectories = true; - prereadFAHeaders = true; - plot_headerversion = VisMF::Header::Version_v1; - checkpoint_headerversion = VisMF::Header::Version_v1; - - amrex::ExecOnFinalize(Amr::Finalize); - - initialized = true; -} - -void -Amr::Finalize () -{ - Amr::state_plot_vars.clear(); - Amr::derive_plot_vars.clear(); - Amr::derive_small_plot_vars.clear(); - Amr::regrid_ba.clear(); - Amr::initial_ba.clear(); - - initialized = false; -} - -bool Amr::Plot_Files_Output () { return plot_files_output; } - -std::ostream& -Amr::DataLog (int i) -{ - return *datalog[i]; -} - -int -Amr::NumDataLogs () -{ - return datalog.size(); -} - -bool -Amr::RegridOnRestart () const -{ - return regrid_on_restart; -} - -void -Amr::setDtMin (const Vector& dt_min_in) -{ - for (int i = 0; i <= finest_level; i++) - dt_min[i] = dt_min_in[i]; -} - -Vector >& -Amr::getAmrLevels () -{ - return amr_level; -} - -long -Amr::cellCount (int lev) -{ - return amr_level[lev]->countCells(); -} - -int -Amr::numGrids (int lev) -{ - return amr_level[lev]->numGrids(); -} - -std::unique_ptr -Amr::derive (const std::string& name, - Real time, - int lev, - int ngrow) -{ - return amr_level[lev]->derive(name,time,ngrow); -} - -Amr::Amr () - : - AmrCore() -{ - Initialize(); - InitAmr(); -} - -Amr::Amr (const RealBox* rb, int max_level_in, const Vector& n_cell_in, int coord) - : - AmrCore(rb,max_level_in,n_cell_in,coord) -{ - Initialize(); - InitAmr(); -} - -void -Amr::InitAmr () -{ - BL_PROFILE("Amr::InitAmr()"); - // - // Determine physics class. - // - levelbld = getLevelBld(); - // - // Global function that define state variables. - // - levelbld->variableSetUp(); - // - // Set default values. - // - plot_int = -1; - small_plot_int = -1; - last_plotfile = 0; - last_smallplotfile = -1; - last_checkpoint = 0; - record_run_info = false; - record_grid_info = false; - file_name_digits = 5; - record_run_info_terse = false; - bUserStopRequest = false; - message_int = 10; - - for (int i = 0; i < BL_SPACEDIM; i++) - isPeriodic[i] = false; - - ParmParse pp("amr"); - // - // Check for command line flags. 
- // - pp.query("regrid_on_restart",regrid_on_restart); - pp.query("use_efficient_regrid",use_efficient_regrid); - pp.query("plotfile_on_restart",plotfile_on_restart); - pp.query("checkpoint_on_restart",checkpoint_on_restart); - - pp.query("compute_new_dt_on_regrid",compute_new_dt_on_regrid); - - pp.query("mffile_nstreams", mffile_nstreams); - pp.query("probinit_natonce", probinit_natonce); - - probinit_natonce = std::max(1, std::min(ParallelDescriptor::NProcs(), probinit_natonce)); - - pp.query("file_name_digits", file_name_digits); - - pp.query("initial_grid_file",initial_grids_file); - pp.query("regrid_file" , regrid_grids_file); - - pp.query("message_int", message_int); - - if (pp.contains("run_log")) - { - std::string log_file_name; - pp.get("run_log",log_file_name); - setRecordRunInfo(log_file_name); - } - if (pp.contains("run_log_terse")) - { - std::string log_file_name; - pp.get("run_log_terse",log_file_name); - setRecordRunInfoTerse(log_file_name); - } - if (pp.contains("grid_log")) - { - std::string grid_file_name; - pp.get("grid_log",grid_file_name); - setRecordGridInfo(grid_file_name); - } - - if (pp.contains("data_log")) - { - int num_datalogs = pp.countval("data_log"); - datalog.resize(num_datalogs); - datalogname.resize(num_datalogs); - pp.queryarr("data_log",datalogname,0,num_datalogs); - for (int i = 0; i < num_datalogs; i++) - setRecordDataInfo(i,datalogname[i]); - } - - probin_file = "probin"; // Make "probin" the default - - if (pp.contains("probin_file")) - { - pp.get("probin_file",probin_file); - } - // - // If set, then restart from checkpoint file. - // - pp.query("restart", restart_chkfile); - // - // If set, then restart from plotfile. - // - pp.query("restart_from_plotfile", restart_pltfile); - - int nlev = max_level+1; - dt_level.resize(nlev); - level_steps.resize(nlev); - level_count.resize(nlev); - n_cycle.resize(nlev); - dt_min.resize(nlev); - amr_level.resize(nlev); - // - // Set bogus values. - // - for (int i = 0; i < nlev; i++) - { - dt_level[i] = 1.e200; // Something nonzero so old & new will differ - level_steps[i] = 0; - level_count[i] = 0; - n_cycle[i] = 0; - dt_min[i] = 0.0; - } - - // Make the default regrid_int = 1 for all levels. - if (max_level > 0) - { - regrid_int.resize(max_level); - for (int i = 0; i < max_level; i++) - regrid_int[i] = 1; - } - - // - // Setup plot and checkpoint controls. - // - initPltAndChk(); - - // - // Setup subcycling controls. - // - initSubcycle(); - - // - // Read in the regrid interval if max_level > 0. - // - if (max_level > 0) - { - int numvals = pp.countval("regrid_int"); - if (numvals == 1) - { - // - // Set all values to the single available value. 
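
The numvals == 1 branch below broadcasts one regrid_int value to every level, so with max_level = 3 the two inputs forms are equivalent (values illustrative):

    amr.regrid_int = 2        # single value, applied to levels 0 through 2
    amr.regrid_int = 2 2 2    # the same thing, spelled out per level
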
-            //
-            int the_regrid_int = 0;
-            pp.query("regrid_int",the_regrid_int);
-            for (int i = 0; i < max_level; i++)
-            {
-                regrid_int[i] = the_regrid_int;
-            }
-        }
-        else if (numvals == 0)
-        {
-            amrex::Print(std::cerr) << "Using default regrid_int = 1 at all levels!\n";
-        }
-        else if (numvals < max_level)
-        {
-            amrex::Error("You did not specify enough values of regrid_int");
-        }
-        else
-        {
-            //
-            // Otherwise we expect a vector of max_level values
-            //
-            pp.queryarr("regrid_int",regrid_int,0,max_level);
-        }
-    }
-
-    if (max_level > 0 && !initial_grids_file.empty())
-    {
-#define STRIP while( is.get() != '\n' ) {}
-        std::ifstream is(initial_grids_file.c_str(),std::ios::in);
-
-        if (!is.good())
-            amrex::FileOpenFailed(initial_grids_file);
-
-        int in_finest,ngrid;
-
-        is >> in_finest;
-        STRIP;
-        initial_ba.resize(in_finest);
-
-        use_fixed_upto_level = in_finest;
-        if (in_finest > max_level)
-            amrex::Error("You have fewer levels in your inputs file than in your grids file!");
-
-        for (int lev = 1; lev <= in_finest; lev++)
-        {
-            BoxList bl;
-            is >> ngrid;
-            STRIP;
-            for (int i = 0; i < ngrid; i++)
-            {
-                Box bx;
-                is >> bx;
-                STRIP;
-                bx.refine(ref_ratio[lev-1]);
-                bl.push_back(bx);
-            }
-            initial_ba[lev-1].define(bl);
-        }
-        is.close();
-        amrex::Print() << "Read initial_ba. Size is " << initial_ba.size() << "\n";
-
-#undef STRIP
-    }
-
-    if (max_level > 0 && !regrid_grids_file.empty())
-    {
-#define STRIP while( is.get() != '\n' ) {}
-        std::ifstream is(regrid_grids_file.c_str(),std::ios::in);
-
-        if (!is.good())
-            amrex::FileOpenFailed(regrid_grids_file);
-
-        int in_finest,ngrid;
-
-        is >> in_finest;
-        STRIP;
-        regrid_ba.resize(in_finest);
-        for (int lev = 1; lev <= in_finest; lev++)
-        {
-            BoxList bl;
-            is >> ngrid;
-            STRIP;
-            for (int i = 0; i < ngrid; i++)
-            {
-                Box bx;
-                is >> bx;
-                STRIP;
-                bx.refine(ref_ratio[lev-1]);
-                for (int idim = 0 ; idim < BL_SPACEDIM; ++idim)
-                {
-                    if (bx.length(idim) > max_grid_size[lev][idim])
-                    {
-                        amrex::Print() << "Grid " << bx << " too large" << '\n';
-                        amrex::Error();
-                    }
-                }
-                bl.push_back(bx);
-            }
-            regrid_ba[lev-1].define(bl);
-        }
-        is.close();
-#undef STRIP
-    }
-
-    loadbalance_with_workestimates = 0;
-    pp.query("loadbalance_with_workestimates", loadbalance_with_workestimates);
-
-    loadbalance_level0_int = 2;
-    pp.query("loadbalance_level0_int", loadbalance_level0_int);
-
-    loadbalance_max_fac = 1.5;
-    pp.query("loadbalance_max_fac", loadbalance_max_fac);
-}
-
-bool
-Amr::isStatePlotVar (const std::string& name)
-{
-    for (std::list<std::string>::const_iterator li = state_plot_vars.begin(), End = state_plot_vars.end();
-         li != End;
-         ++li)
-    {
-        if (*li == name) {
-            return true;
-        }
-    }
-    return false;
-}
-
-bool
-Amr::isStateSmallPlotVar (const std::string& name)
-{
-    for (std::list<std::string>::const_iterator li = state_small_plot_vars.begin(), End = state_small_plot_vars.end();
-         li != End;
-         ++li)
-    {
-        if (*li == name)
-            return true;
-    }
-    return false;
-}
-
-void
-Amr::fillStatePlotVarList ()
-{
-    state_plot_vars.clear();
-    const DescriptorList &desc_lst = AmrLevel::get_desc_lst();
-    for (int typ(0); typ < desc_lst.size(); ++typ) {
-        for (int comp(0); comp < desc_lst[typ].nComp(); ++comp) {
-            if (desc_lst[typ].getType() == IndexType::TheCellType()) {
-                state_plot_vars.push_back(desc_lst[typ].name(comp));
-            }
-        }
-    }
-}
-
-void
-Amr::clearStatePlotVarList ()
-{
-    state_plot_vars.clear();
-}
-
-void
-Amr::clearStateSmallPlotVarList ()
-{
-    state_small_plot_vars.clear();
-}
-
-void
-Amr::addStatePlotVar (const std::string& name)
-{
-    if ( !
isStatePlotVar(name)) { - state_plot_vars.push_back(name); - } -} - -void -Amr::addStateSmallPlotVar (const std::string& name) -{ - if (!isStateSmallPlotVar(name)) - state_small_plot_vars.push_back(name); -} - -void -Amr::deleteStatePlotVar (const std::string& name) -{ - if (isStatePlotVar(name)) { - state_plot_vars.remove(name); - } -} - -bool -Amr::isDerivePlotVar (const std::string& name) -{ - for (std::list::const_iterator li = derive_plot_vars.begin(), End = derive_plot_vars.end(); - li != End; - ++li) - { - if (*li == name) { - return true; - } - } - - return false; -} - -bool -Amr::isDeriveSmallPlotVar (const std::string& name) -{ - for (std::list::const_iterator li = derive_small_plot_vars.begin(), End = derive_small_plot_vars.end(); - li != End; - ++li) - { - if (*li == name) { - return true; - } - } - - return false; -} - -void -Amr::fillDerivePlotVarList () -{ - derive_plot_vars.clear(); - DeriveList& derive_lst = AmrLevel::get_derive_lst(); - std::list& dlist = derive_lst.dlist(); - for (std::list::const_iterator it = dlist.begin(), End = dlist.end(); - it != End; - ++it) - { - if (it->deriveType() == IndexType::TheCellType()) - { - derive_plot_vars.push_back(it->name()); - } - } -} - -void -Amr::fillDeriveSmallPlotVarList () -{ - derive_small_plot_vars.clear(); - DeriveList& derive_lst = AmrLevel::get_derive_lst(); - std::list& dlist = derive_lst.dlist(); - for (std::list::const_iterator it = dlist.begin(), End = dlist.end(); - it != End; - ++it) - { - if (it->deriveType() == IndexType::TheCellType()) - { - derive_small_plot_vars.push_back(it->name()); - } - } -} - -void -Amr::clearDerivePlotVarList () -{ - derive_plot_vars.clear(); -} - -void -Amr::clearDeriveSmallPlotVarList () -{ - derive_small_plot_vars.clear(); -} - -void -Amr::addDerivePlotVar (const std::string& name) -{ - if (!isDerivePlotVar(name)) - derive_plot_vars.push_back(name); -} - -void -Amr::addDeriveSmallPlotVar (const std::string& name) -{ - if (!isDeriveSmallPlotVar(name)) - derive_small_plot_vars.push_back(name); -} - -void -Amr::deleteDerivePlotVar (const std::string& name) -{ - if (isDerivePlotVar(name)) - derive_plot_vars.remove(name); -} - -void -Amr::deleteDeriveSmallPlotVar (const std::string& name) -{ - if (isDeriveSmallPlotVar(name)) - derive_small_plot_vars.remove(name); -} - -Amr::~Amr () -{ - levelbld->variableCleanUp(); - - Amr::Finalize(); -} - -void -Amr::setRecordGridInfo (const std::string& filename) -{ - record_grid_info = true; - if (ParallelDescriptor::IOProcessor()) - { - gridlog.open(filename.c_str(),std::ios::out|std::ios::app); - if (!gridlog.good()) - amrex::FileOpenFailed(filename); - } - ParallelDescriptor::Barrier("Amr::setRecordGridInfo"); -} - -void -Amr::setRecordRunInfo (const std::string& filename) -{ - record_run_info = true; - if (ParallelDescriptor::IOProcessor()) - { - runlog.open(filename.c_str(),std::ios::out|std::ios::app); - if (!runlog.good()) - amrex::FileOpenFailed(filename); - } - ParallelDescriptor::Barrier("Amr::setRecordRunInfo"); -} - -void -Amr::setRecordRunInfoTerse (const std::string& filename) -{ - record_run_info_terse = true; - if (ParallelDescriptor::IOProcessor()) - { - runlog_terse.open(filename.c_str(),std::ios::out|std::ios::app); - if (!runlog_terse.good()) - amrex::FileOpenFailed(filename); - } - ParallelDescriptor::Barrier("Amr::setRecordRunInfoTerse"); -} - -void -Amr::setRecordDataInfo (int i, const std::string& filename) -{ - if (ParallelDescriptor::IOProcessor()) - { - datalog[i].reset(new std::fstream); - 
datalog[i]->open(filename.c_str(),std::ios::out|std::ios::app); - if (!datalog[i]->good()) - amrex::FileOpenFailed(filename); - } - ParallelDescriptor::Barrier("Amr::setRecordDataInfo"); -} - -void -Amr::setDtLevel (const Vector& dt_lev) -{ - for (int i = 0; i <= finest_level; i++) - dt_level[i] = dt_lev[i]; -} - -void -Amr::setDtLevel (Real dt, int lev) -{ - dt_level[lev] = dt; -} - -void -Amr::setNCycle (const Vector& ns) -{ - for (int i = 0; i <= finest_level; i++) - n_cycle[i] = ns[i]; -} - -long -Amr::cellCount () -{ - long cnt = 0; - for (int i = 0; i <= finest_level; i++) - cnt += amr_level[i]->countCells(); - return cnt; -} - -int -Amr::numGrids () -{ - int cnt = 0; - for (int i = 0; i <= finest_level; i++) - cnt += amr_level[i]->numGrids(); - return cnt; -} - -int -Amr::okToContinue () -{ - int ok = true; - for (int i = 0; ok && (i <= finest_level); i++) - ok = ok && amr_level[i]->okToContinue(); - if(bUserStopRequest) { - ok = false; - } - return ok; -} - -void -Amr::writePlotFile () -{ - if ( ! Plot_Files_Output()) { - return; - } - - BL_PROFILE_REGION_START("Amr::writePlotFile()"); - BL_PROFILE("Amr::writePlotFile()"); - - VisMF::SetNOutFiles(plot_nfiles); - VisMF::Header::Version currentVersion(VisMF::GetHeaderVersion()); - VisMF::SetHeaderVersion(plot_headerversion); - - if (first_plotfile) { - first_plotfile = false; - amr_level[0]->setPlotVariables(); - } - - Real dPlotFileTime0 = ParallelDescriptor::second(); - - const std::string& pltfile = amrex::Concatenate(plot_file_root,level_steps[0],file_name_digits); - - if (verbose > 0) { - amrex::Print() << "PLOTFILE: file = " << pltfile << '\n'; - } - - if (record_run_info && ParallelDescriptor::IOProcessor()) { - runlog << "PLOTFILE: file = " << pltfile << '\n'; - } - - amrex::StreamRetry sretry(pltfile, abort_on_stream_retry_failure, - stream_max_tries); - - const std::string pltfileTemp(pltfile + ".temp"); - - while(sretry.TryFileOutput()) { - // - // if either the pltfile or pltfileTemp exists, rename them - // to move them out of the way. then create pltfile - // with the temporary name, then rename it back when - // it is finished writing. then stream retry can rename - // it to a bad suffix if there were stream errors. - // - - if(precreateDirectories) { // ---- make all directories at once - amrex::UtilRenameDirectoryToOld(pltfile, false); // dont call barrier - if (verbose > 1) { - amrex::Print() << "IOIOIOIO: precreating directories for " << pltfileTemp << "\n"; - } - amrex::PreBuildDirectorHierarchy(pltfileTemp, "Level_", finest_level + 1, true); // call barrier - } else { - amrex::UtilRenameDirectoryToOld(pltfile, false); // dont call barrier - amrex::UtilCreateCleanDirectory(pltfileTemp, true); // call barrier - } - - std::string HeaderFileName(pltfileTemp + "/Header"); - - VisMF::IO_Buffer io_buffer(VisMF::GetIOBufferSize()); - - std::ofstream HeaderFile; - - HeaderFile.rdbuf()->pubsetbuf(io_buffer.dataPtr(), io_buffer.size()); - - int old_prec(0); - - if (ParallelDescriptor::IOProcessor()) { - // - // Only the IOProcessor() writes to the header file. - // - HeaderFile.open(HeaderFileName.c_str(), std::ios::out | std::ios::trunc | - std::ios::binary); - if ( ! HeaderFile.good()) { - amrex::FileOpenFailed(HeaderFileName); - } - old_prec = HeaderFile.precision(15); - } - - for (int k(0); k <= finest_level; ++k) { - amr_level[k]->writePlotFile(pltfileTemp, HeaderFile); - } - - if (ParallelDescriptor::IOProcessor()) { - HeaderFile.precision(old_prec); - if ( ! 
HeaderFile.good()) { - amrex::Error("Amr::writePlotFile() failed"); - } - } - - last_plotfile = level_steps[0]; - - if (verbose > 0) { - const int IOProc = ParallelDescriptor::IOProcessorNumber(); - Real dPlotFileTime = ParallelDescriptor::second() - dPlotFileTime0; - - ParallelDescriptor::ReduceRealMax(dPlotFileTime,IOProc); - - amrex::Print() << "Write plotfile time = " << dPlotFileTime << " seconds" << "\n\n"; - } - ParallelDescriptor::Barrier("Amr::writePlotFile::end"); - - if(ParallelDescriptor::IOProcessor()) { - std::rename(pltfileTemp.c_str(), pltfile.c_str()); - } - ParallelDescriptor::Barrier("Renaming temporary plotfile."); - // - // the plotfile file now has the regular name - // - - } // end while - - VisMF::SetHeaderVersion(currentVersion); - - BL_PROFILE_REGION_STOP("Amr::writePlotFile()"); -} - -void -Amr::writeSmallPlotFile () -{ - if ( ! Plot_Files_Output()) { - return; - } - - BL_PROFILE_REGION_START("Amr::writeSmallPlotFile()"); - BL_PROFILE("Amr::writeSmallPlotFile()"); - - VisMF::SetNOutFiles(plot_nfiles); - VisMF::Header::Version currentVersion(VisMF::GetHeaderVersion()); - VisMF::SetHeaderVersion(plot_headerversion); - - if (first_smallplotfile) { - first_smallplotfile = false; - amr_level[0]->setSmallPlotVariables(); - } - - // Don't continue if we have no variables to plot. - - if (stateSmallPlotVars().size() == 0) { - return; - } - - Real dPlotFileTime0 = ParallelDescriptor::second(); - - const std::string& pltfile = amrex::Concatenate(small_plot_file_root, - level_steps[0], - file_name_digits); - - if (verbose > 0) { - amrex::Print() << "SMALL PLOTFILE: file = " << pltfile << '\n'; - } - - if (record_run_info && ParallelDescriptor::IOProcessor()) { - runlog << "SMALL PLOTFILE: file = " << pltfile << '\n'; - } - - amrex::StreamRetry sretry(pltfile, abort_on_stream_retry_failure, - stream_max_tries); - - const std::string pltfileTemp(pltfile + ".temp"); - - while(sretry.TryFileOutput()) { - // - // if either the pltfile or pltfileTemp exists, rename them - // to move them out of the way. then create pltfile - // with the temporary name, then rename it back when - // it is finished writing. then stream retry can rename - // it to a bad suffix if there were stream errors. - // - if(precreateDirectories) { // ---- make all directories at once - amrex::UtilRenameDirectoryToOld(pltfile, false); // dont call barrier - amrex::UtilCreateCleanDirectory(pltfileTemp, false); // dont call barrier - for(int i(0); i <= finest_level; ++i) { - amr_level[i]->CreateLevelDirectory(pltfileTemp); - } - ParallelDescriptor::Barrier("Amr::precreate smallplotfile Directories"); - } else { - amrex::UtilRenameDirectoryToOld(pltfile, false); // dont call barrier - amrex::UtilCreateCleanDirectory(pltfileTemp, true); // call barrier - } - - - std::string HeaderFileName(pltfileTemp + "/Header"); - - VisMF::IO_Buffer io_buffer(VisMF::GetIOBufferSize()); - - std::ofstream HeaderFile; - - HeaderFile.rdbuf()->pubsetbuf(io_buffer.dataPtr(), io_buffer.size()); - - int old_prec(0); - - if (ParallelDescriptor::IOProcessor()) { - // - // Only the IOProcessor() writes to the header file. - // - HeaderFile.open(HeaderFileName.c_str(), std::ios::out | std::ios::trunc | - std::ios::binary); - if ( ! HeaderFile.good()) { - amrex::FileOpenFailed(HeaderFileName); - } - old_prec = HeaderFile.precision(15); - } - - for (int k(0); k <= finest_level; ++k) { - amr_level[k]->writeSmallPlotFile(pltfileTemp, HeaderFile); - } - - if (ParallelDescriptor::IOProcessor()) { - HeaderFile.precision(old_prec); - if ( ! 
HeaderFile.good()) { - amrex::Error("Amr::writeSmallPlotFile() failed"); - } - } - - last_smallplotfile = level_steps[0]; - - if (verbose > 0) { - const int IOProc = ParallelDescriptor::IOProcessorNumber(); - Real dPlotFileTime = ParallelDescriptor::second() - dPlotFileTime0; - - ParallelDescriptor::ReduceRealMax(dPlotFileTime,IOProc); - - amrex::Print() << "Write small plotfile time = " << dPlotFileTime << " seconds" << "\n\n"; - } - ParallelDescriptor::Barrier("Amr::writeSmallPlotFile::end"); - - if(ParallelDescriptor::IOProcessor()) { - std::rename(pltfileTemp.c_str(), pltfile.c_str()); - } - ParallelDescriptor::Barrier("Renaming temporary plotfile."); - // - // the plotfile file now has the regular name - // - - } // end while - - VisMF::SetHeaderVersion(currentVersion); - - BL_PROFILE_REGION_STOP("Amr::writeSmallPlotFile()"); -} - -void -Amr::checkInput () -{ - if (max_level < 0) - amrex::Error("checkInput: max_level not set"); - // - // Check that blocking_factor is a power of 2. - // - for (int i = 0; i < max_level; i++) - { - for (int idim = 0; idim < BL_SPACEDIM; ++idim) - { - int k = blocking_factor[i][idim]; - while ( k > 0 && (k%2 == 0) ) - k /= 2; - if (k != 1) - amrex::Error("Amr::checkInput: blocking_factor not power of 2"); - } - } - // - // Check level dependent values. - // - for (int i = 0; i < max_level; i++) - { - if (MaxRefRatio(i) < 2 || MaxRefRatio(i) > 12) - amrex::Error("Amr::checkInput: bad ref_ratios"); - } - const Box& domain = Geom(0).Domain(); - if (!domain.ok()) - amrex::Error("level 0 domain bad or not set"); - // - // Check that domain size is a multiple of blocking_factor[0]. - // - for (int i = 0; i < BL_SPACEDIM; i++) - { - int len = domain.length(i); - if (len%blocking_factor[0][i] != 0) - amrex::Error("domain size not divisible by blocking_factor"); - } - // - // Check that max_grid_size is even. - // - for (int i = 0; i < max_level; i++) - { - for (int idim = 0; idim < BL_SPACEDIM; ++idim) { - if (max_grid_size[i][idim]%2 != 0) { - amrex::Error("max_grid_size is not even"); - } - } - } - - // - // Check that max_grid_size is a multiple of blocking_factor at every level. - // - for (int i = 0; i < max_level; i++) - { - for (int idim = 0; idim < BL_SPACEDIM; ++idim) { - if (max_grid_size[i][idim]%blocking_factor[i][idim] != 0) { - amrex::Error("max_grid_size not divisible by blocking_factor"); - } - } - } - - if( ! Geom(0).ProbDomain().ok()) { - amrex::Error("Amr::checkInput: bad physical problem size"); - } - - if(verbose > 0) { - amrex::Print() << "Successfully read inputs file ... " << '\n'; - } -} - -void -Amr::init (Real strt_time, - Real stop_time) -{ - BL_PROFILE_REGION_START("Amr::init()"); - BL_PROFILE("Amr::init()"); - if( ! restart_chkfile.empty() && restart_chkfile != "init") - { - restart(restart_chkfile); - } - else - { - initialInit(strt_time,stop_time); - checkPoint(); - if(plot_int > 0 || plot_per > 0) { - writePlotFile(); - } - if (small_plot_int > 0 || small_plot_per > 0) - writeSmallPlotFile(); - } - -#ifdef BL_COMM_PROFILING - Vector probDomain(maxLevel()+1); - for(int i(0); i < probDomain.size(); ++i) { - probDomain[i] = Geom(i).Domain(); - } - BL_COMM_PROFILE_INITAMR(finest_level, max_level, ref_ratio, probDomain); -#endif - BL_PROFILE_REGION_STOP("Amr::init()"); -} - -void -Amr::readProbinFile (int& a_init) -{ - BL_PROFILE("Amr::readProbinFile()"); - // - // Populate integer array with name of probin file. 
- // - int probin_file_length = probin_file.length(); - - Vector<int> probin_file_name(probin_file_length); - - for (int i = 0; i < probin_file_length; i++) - probin_file_name[i] = probin_file[i]; - - if (verbose > 0) - amrex::Print() << "Starting to call amrex_probinit ... \n"; - - const int nAtOnce = probinit_natonce; - const int MyProc = ParallelDescriptor::MyProc(); - const int NProcs = ParallelDescriptor::NProcs(); - const int NSets = (NProcs + (nAtOnce - 1)) / nAtOnce; - const int MySet = MyProc/nAtOnce; - - Real piStart = 0, piEnd = 0, piStartAll = ParallelDescriptor::second(); - - for (int iSet = 0; iSet < NSets; ++iSet) - { - if (MySet == iSet) - { - // - // Call the pesky probin reader. - // - piStart = ParallelDescriptor::second(); - -#ifdef AMREX_DIMENSION_AGNOSTIC - - amrex_probinit(&a_init, - probin_file_name.dataPtr(), - &probin_file_length, - AMREX_ZFILL(Geom(0).ProbLo()), - AMREX_ZFILL(Geom(0).ProbHi())); - -#else - - amrex_probinit(&a_init, - probin_file_name.dataPtr(), - &probin_file_length, - Geom(0).ProbLo(), - Geom(0).ProbHi()); - -#endif - - piEnd = ParallelDescriptor::second(); - const int iBuff = 0; - const int wakeUpPID = (MyProc + nAtOnce); - const int tag = (MyProc % nAtOnce); - if (wakeUpPID < NProcs) - ParallelDescriptor::Send(&iBuff, 1, wakeUpPID, tag); - } - if (MySet == (iSet + 1)) - { - // - // Next set waits. - // - int iBuff; - int waitForPID = (MyProc - nAtOnce); - int tag = (MyProc % nAtOnce); - ParallelDescriptor::Recv(&iBuff, 1, waitForPID, tag); - } - } - - if (verbose > 1) - { - const int IOProc = ParallelDescriptor::IOProcessorNumber(); - Real piTotal = piEnd - piStart; - Real piTotalAll = ParallelDescriptor::second() - piStartAll; - - ParallelDescriptor::ReduceRealMax(piTotal, IOProc); - ParallelDescriptor::ReduceRealMax(piTotalAll, IOProc); - - amrex::Print() << "amrex_probinit max time = " << piTotal << '\n' - << "amrex_probinit total time = " << piTotalAll << '\n'; - } - - if (verbose > 0) - amrex::Print() << "Successfully run amrex_probinit\n"; -}
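The set-based loop in readProbinFile() above is a throttling idiom: only nAtOnce ranks touch the probin file at a time, and each rank that finishes wakes its counterpart in the next set. A minimal standalone sketch of the same idiom, assuming raw MPI and a hypothetical read_input() stand-in for the actual file read:

#include <mpi.h>

void read_input();  // hypothetical: whatever actually touches the shared file

// Only nAtOnce ranks read concurrently; rank p waits for rank p-nAtOnce
// to finish, reads, then wakes rank p+nAtOnce.
void throttled_read (int myproc, int nprocs, int nAtOnce)
{
    int token = 0;
    if (myproc >= nAtOnce) {
        // Wait until the matching rank in the previous set is done.
        MPI_Recv(&token, 1, MPI_INT, myproc - nAtOnce, myproc % nAtOnce,
                 MPI_COMM_WORLD, MPI_STATUS_IGNORE);
    }
    read_input();
    if (myproc + nAtOnce < nprocs) {
        // Wake the matching rank in the next set.
        MPI_Send(&token, 1, MPI_INT, myproc + nAtOnce, myproc % nAtOnce,
                 MPI_COMM_WORLD);
    }
}

The tag arithmetic (MyProc % nAtOnce) pairs each rank with its successor nAtOnce ranks away, so the wake-up messages of different chains never collide.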
- -void -Amr::initialInit (Real strt_time, - Real stop_time, - const BoxArray* lev0_grids, - const Vector<int>* pmap) -{ - BL_PROFILE("Amr::initialInit()"); - InitializeInit(strt_time, stop_time, lev0_grids, pmap); - - // This is a subtlety, but in the case where we are initializing the data - // from a plotfile, we want to use the time read in from the plotfile as - // the start time instead of using "strt_time". - // The Amr data "cumtime" has been set in InitializeInit; if we are restarting - // from a plotfile, then cumtime must be re-defined in that initialization routine. - // Thus here we pass "cumtime" rather than "strt_time" to FinalizeInit. - FinalizeInit (cumtime, stop_time); -} - -void -Amr::InitializeInit(Real strt_time, - Real stop_time, - const BoxArray* lev0_grids, - const Vector<int>* pmap) -{ - BL_PROFILE("Amr::InitializeInit()"); - BL_COMM_PROFILE_NAMETAG("Amr::InitializeInit TOP"); - if (check_input) checkInput(); - // - // Generate internal values from user-supplied values. - // - finest_level = 0; - // - // Init problem dependent data. - // - int linit = true; - - if (!probin_file.empty()) { - readProbinFile(linit); - } - - cumtime = strt_time; - // - // Define base level grids. Note that if we are restarting from a plotfile, this - // routine will call the level 0 AmrLevel initialization which will overwrite cumtime. 
- // - defBaseLevel(strt_time, lev0_grids, pmap); -} - -void -Amr::FinalizeInit (Real strt_time, - Real stop_time) -{ - BL_PROFILE("Amr::FinalizeInit()"); - // - // Compute dt and set time levels of all grid data. - // - amr_level[0]->computeInitialDt(finest_level, - sub_cycle, - n_cycle, - ref_ratio, - dt_level, - stop_time); - // - // The following was added for multifluid. - // - Real dt0 = dt_level[0]; - dt_min[0] = dt_level[0]; - n_cycle[0] = 1; - - for (int lev = 1; lev <= max_level; lev++) - { - dt0 /= n_cycle[lev]; - dt_level[lev] = dt0; - dt_min[lev] = dt_level[lev]; - } - - if (max_level > 0) - bldFineLevels(strt_time); - - for (int lev = 0; lev <= finest_level; lev++) - amr_level[lev]->setTimeLevel(strt_time,dt_level[lev],dt_level[lev]); - - for (int lev = 0; lev <= finest_level; lev++) - amr_level[lev]->post_regrid(0,finest_level); - - for (int lev = 0; lev <= finest_level; lev++) - { - level_steps[lev] = 0; - level_count[lev] = 0; - } - - // - // Perform any special post_initialization operations. - // - for(int lev(0); lev <= finest_level; ++lev) { - amr_level[lev]->post_init(stop_time); - } - - if (ParallelDescriptor::IOProcessor()) - { - if (verbose > 1) - { - std::cout << "INITIAL GRIDS \n"; - printGridInfo(std::cout,0,finest_level); - } - else if (verbose > 0) - { - std::cout << "INITIAL GRIDS \n"; - printGridSummary(std::cout,0,finest_level); - } - } - - if (record_grid_info && ParallelDescriptor::IOProcessor()) - { - gridlog << "INITIAL GRIDS \n"; - printGridInfo(gridlog,0,finest_level); - } - BL_COMM_PROFILE_NAMETAG("Amr::initialInit BOTTOM"); -} - -void -Amr::restart (const std::string& filename) -{ - BL_PROFILE_REGION_START("Amr::restart()"); - BL_PROFILE("Amr::restart()"); - - which_level_being_advanced = -1; - - Real dRestartTime0 = ParallelDescriptor::second(); - - VisMF::SetMFFileInStreams(mffile_nstreams); - - if (verbose > 0) { - amrex::Print() << "restarting calculation from file: " << filename << "\n"; - } - - if (record_run_info && ParallelDescriptor::IOProcessor()) { - runlog << "RESTART from file = " << filename << '\n'; - } - // - // Init problem dependent data. - // - int linit = false; - - readProbinFile(linit); - // - // Start calculation from given restart file. - // - if (record_run_info && ParallelDescriptor::IOProcessor()) { - runlog << "RESTART from file = " << filename << '\n'; - } - - // ---- preread and broadcast all FabArray headers if this file exists - std::map<std::string, Vector<char> > faHeaderMap; - if(prereadFAHeaders) { - // ---- broadcast the file with the names of the fabarray headers - std::string faHeaderFilesName(filename + "/FabArrayHeaders.txt"); - Vector<char> faHeaderFileChars; - bool bExitOnError(false); // ---- dont exit if this file does not exist - ParallelDescriptor::ReadAndBcastFile(faHeaderFilesName, faHeaderFileChars, - bExitOnError); - if(faHeaderFileChars.size() > 0) { // ---- headers were read - std::string faFileCharPtrString(faHeaderFileChars.dataPtr()); - std::istringstream fais(faFileCharPtrString, std::istringstream::in); - while ( ! fais.eof()) { // ---- read and broadcast each header - std::string faHeaderName; - fais >> faHeaderName; - if( ! 
fais.eof()) { - std::string faHeaderFullName(filename + '/' + faHeaderName + "_H"); - Vector<char> &tempCharArray = faHeaderMap[faHeaderFullName]; - ParallelDescriptor::ReadAndBcastFile(faHeaderFullName, tempCharArray); - if(verbose > 2) { - amrex::Print() - << ":::: faHeaderName faHeaderFullName tempCharArray.size() = " << faHeaderName - << " " << faHeaderFullName << " " << tempCharArray.size() << "\n"; - } - } - } - StateData::SetFAHeaderMapPtr(&faHeaderMap); - } - } - - // - // Open the checkpoint header file for reading. - // - std::string File(filename + "/Header"); - - VisMF::IO_Buffer io_buffer(VisMF::GetIOBufferSize()); - - Vector<char> fileCharPtr; - ParallelDescriptor::ReadAndBcastFile(File, fileCharPtr); - std::string fileCharPtrString(fileCharPtr.dataPtr()); - std::istringstream is(fileCharPtrString, std::istringstream::in); - // - // Read global data. - // - // Attempt to differentiate between old and new CheckPointFiles. - // - int spdim; - bool new_checkpoint_format = false; - std::string first_line; - - std::getline(is,first_line); - - if (first_line == CheckPointVersion) - { - new_checkpoint_format = true; - is >> spdim; - } - else - { - spdim = atoi(first_line.c_str()); - } - - if (spdim != BL_SPACEDIM) - { - std::cerr << "Amr::restart(): bad spacedim = " << spdim << '\n'; - amrex::Abort(); - } - - is >> cumtime; - int mx_lev; - is >> mx_lev; - is >> finest_level; - - Vector<Box> inputs_domain(max_level+1); - for (int lev = 0; lev <= max_level; ++lev) - { - Box bx(Geom(lev).Domain().smallEnd(),Geom(lev).Domain().bigEnd()); - inputs_domain[lev] = bx; - } - - if (max_level >= mx_lev) { - - for (int i(0); i <= mx_lev; ++i) { is >> Geom(i); } - for (int i(0); i < mx_lev; ++i) { is >> ref_ratio[i]; } - for (int i(0); i <= mx_lev; ++i) { is >> dt_level[i]; } - - if (new_checkpoint_format) - { - for (int i(0); i <= mx_lev; ++i) { is >> dt_min[i]; } - } - else - { - for (int i(0); i <= mx_lev; ++i) { dt_min[i] = dt_level[i]; } - } - - Vector<int> n_cycle_in; - n_cycle_in.resize(mx_lev+1); - for (int i(0); i <= mx_lev; ++i) { is >> n_cycle_in[i]; } - bool any_changed = false; - - for (int i(0); i <= mx_lev; ++i) { - if (n_cycle[i] != n_cycle_in[i]) { - any_changed = true; - if (verbose > 0) { - amrex::Print() << "Warning: n_cycle has changed at level " << i << - " from " << n_cycle_in[i] << " to " << n_cycle[i] << "\n"; - } - } - } - - // If we change n_cycle then force a full regrid from level 0 up - if (max_level > 0 && any_changed) - { - level_count[0] = regrid_int[0]; - if (verbose > 0) { - amrex::Print() << "Warning: This forces a full regrid \n"; - } - } - - - for (int i(0); i <= mx_lev; ++i) { is >> level_steps[i]; } - for (int i(0); i <= mx_lev; ++i) { is >> level_count[i]; } - - // - // Set bndry conditions. - // - if (max_level > mx_lev) - { - for (int i(mx_lev + 1); i <= max_level; ++i) - { - dt_level[i] = dt_level[i-1]/n_cycle[i]; - level_steps[i] = n_cycle[i]*level_steps[i-1]; - level_count[i] = 0; - } - - // This is just an error check - if ( ! sub_cycle) - { - for (int i(1); i <= finest_level; ++i) - { - if (dt_level[i] != dt_level[i-1]) { - amrex::Error("restart: must have same dt at all levels if not subcycling"); - } - } - } - } - - if (regrid_on_restart && max_level > 0) - { - if (regrid_int[0] > 0) { - level_count[0] = regrid_int[0]; - } else { - amrex::Error("restart: can't have regrid_on_restart and regrid_int <= 0"); - } - } - - checkInput(); - // - // Read levels. 
- // - for (int lev(0); lev <= finest_level; ++lev) - { - amr_level[lev].reset((*levelbld)()); - amr_level[lev]->restart(*this, is); - this->SetBoxArray(lev, amr_level[lev]->boxArray()); - this->SetDistributionMap(lev, amr_level[lev]->DistributionMap()); - } - // - // Build any additional data structures. - // - for (int lev = 0; lev <= finest_level; lev++) { - amr_level[lev]->post_restart(); - } - - } else { - - if (ParallelDescriptor::IOProcessor()) { - amrex::Warning("Amr::restart(): max_level is lower than before"); - } - - int new_finest_level = std::min(max_level,finest_level); - - finest_level = new_finest_level; - - // These are just used to hold the extra stuff we have to read in. - Geometry geom_dummy; - Real real_dummy; - int int_dummy; - IntVect intvect_dummy; - - for (int i(0) ; i <= max_level; ++i) { is >> Geom(i); } - for (int i(max_level + 1); i <= mx_lev ; ++i) { is >> geom_dummy; } - - for (int i(0) ; i < max_level; ++i) { is >> ref_ratio[i]; } - for (int i(max_level); i < mx_lev ; ++i) { is >> intvect_dummy; } - - for (int i(0) ; i <= max_level; ++i) { is >> dt_level[i]; } - for (int i(max_level + 1); i <= mx_lev ; ++i) { is >> real_dummy; } - - if (new_checkpoint_format) { - for (int i(0) ; i <= max_level; ++i) { is >> dt_min[i]; } - for (int i(max_level + 1); i <= mx_lev ; ++i) { is >> real_dummy; } - } else { - for (int i(0); i <= max_level; ++i) { dt_min[i] = dt_level[i]; } - } - - for (int i(0) ; i <= max_level; ++i) { is >> n_cycle[i]; } - for (int i(max_level + 1); i <= mx_lev ; ++i) { is >> int_dummy; } - - for (int i(0) ; i <= max_level; ++i) { is >> level_steps[i]; } - for (int i(max_level + 1); i <= mx_lev ; ++i) { is >> int_dummy; } - - for (int i(0) ; i <= max_level; ++i) { is >> level_count[i]; } - for (int i(max_level + 1); i <= mx_lev ; ++i) { is >> int_dummy; } - - if (regrid_on_restart && max_level > 0) { - if (regrid_int[0] > 0) { - level_count[0] = regrid_int[0]; - } else { - amrex::Error("restart: can't have regrid_on_restart and regrid_int <= 0"); - } - } - - checkInput(); - - // - // Read levels. - // - for (int lev = 0; lev <= new_finest_level; lev++) - { - amr_level[lev].reset((*levelbld)()); - amr_level[lev]->restart(*this, is); - this->SetBoxArray(lev, amr_level[lev]->boxArray()); - this->SetDistributionMap(lev, amr_level[lev]->DistributionMap()); - } - // - // Build any additional data structures. - // - for (int lev = 0; lev <= new_finest_level; lev++) { - amr_level[lev]->post_restart(); - } - } - - for (int lev = 0; lev <= finest_level; ++lev) - { - Box restart_domain(Geom(lev).Domain()); - if ( ! (inputs_domain[lev] == restart_domain) ) - { - amrex::Print() - << "Problem at level " << lev << '\n' - << "Domain according to inputs file is " << inputs_domain[lev] << '\n' - << "Domain according to checkpoint file is " << restart_domain << '\n' - << "Amr::restart() failed -- box from inputs file does not " - << "equal box from restart file. \n"; - amrex::Abort(); - } - } - - if (verbose > 0) - { - Real dRestartTime = ParallelDescriptor::second() - dRestartTime0; - - ParallelDescriptor::ReduceRealMax(dRestartTime,ParallelDescriptor::IOProcessorNumber()); - - amrex::Print() << "Restart time = " << dRestartTime << " seconds." << '\n'; - } - BL_PROFILE_REGION_STOP("Amr::restart()"); -} - -void -Amr::checkPoint () -{ - if( ! 
checkpoint_files_output) { - return; - } - - BL_PROFILE_REGION_START("Amr::checkPoint()"); - BL_PROFILE("Amr::checkPoint()"); - - VisMF::SetNOutFiles(checkpoint_nfiles); - // - // In checkpoint files always write out FABs in NATIVE format. - // - FABio::Format thePrevFormat = FArrayBox::getFormat(); - - FArrayBox::setFormat(FABio::FAB_NATIVE); - - VisMF::Header::Version currentVersion(VisMF::GetHeaderVersion()); - VisMF::SetHeaderVersion(checkpoint_headerversion); - - Real dCheckPointTime0 = ParallelDescriptor::second(); - - const std::string& ckfile = amrex::Concatenate(check_file_root,level_steps[0],file_name_digits); - - if(verbose > 0) { - amrex::Print() << "CHECKPOINT: file = " << ckfile << "\n"; - } - - if(record_run_info && ParallelDescriptor::IOProcessor()) { - runlog << "CHECKPOINT: file = " << ckfile << '\n'; - } - - - amrex::StreamRetry sretry(ckfile, abort_on_stream_retry_failure, - stream_max_tries); - - const std::string ckfileTemp(ckfile + ".temp"); - - while(sretry.TryFileOutput()) { - - StateData::ClearFabArrayHeaderNames(); - - // - // if either the ckfile or ckfileTemp exists, rename them - // to move them out of the way. then create ckfile - // with the temporary name, then rename it back when - // it is finished writing. then stream retry can rename - // it to a bad suffix if there were stream errors. - // - - if(precreateDirectories) { // ---- make all directories at once - amrex::UtilRenameDirectoryToOld(ckfile, false); // dont call barrier - amrex::UtilCreateCleanDirectory(ckfileTemp, false); // dont call barrier - for(int i(0); i <= finest_level; ++i) { - amr_level[i]->CreateLevelDirectory(ckfileTemp); - } - ParallelDescriptor::Barrier("Amr::precreateDirectories"); - } else { - amrex::UtilRenameDirectoryToOld(ckfile, false); // dont call barrier - amrex::UtilCreateCleanDirectory(ckfileTemp, true); // call barrier - } - - std::string HeaderFileName = ckfileTemp + "/Header"; - - VisMF::IO_Buffer io_buffer(VisMF::GetIOBufferSize()); - - std::ofstream HeaderFile; - - HeaderFile.rdbuf()->pubsetbuf(io_buffer.dataPtr(), io_buffer.size()); - - int old_prec = 0; - - if (ParallelDescriptor::IOProcessor()) - { - // - // Only the IOProcessor() writes to the header file. - // - HeaderFile.open(HeaderFileName.c_str(), std::ios::out | std::ios::trunc | - std::ios::binary); - - if ( ! HeaderFile.good()) { - amrex::FileOpenFailed(HeaderFileName); - } - - old_prec = HeaderFile.precision(17); - - HeaderFile << CheckPointVersion << '\n' - << BL_SPACEDIM << '\n' - << cumtime << '\n' - << max_level << '\n' - << finest_level << '\n'; - // - // Write out problem domain. 
- // - for (int i(0); i <= max_level; ++i) { HeaderFile << Geom(i) << ' '; } - HeaderFile << '\n'; - for (int i(0); i < max_level; ++i) { HeaderFile << ref_ratio[i] << ' '; } - HeaderFile << '\n'; - for (int i(0); i <= max_level; ++i) { HeaderFile << dt_level[i] << ' '; } - HeaderFile << '\n'; - for (int i(0); i <= max_level; ++i) { HeaderFile << dt_min[i] << ' '; } - HeaderFile << '\n'; - for (int i(0); i <= max_level; ++i) { HeaderFile << n_cycle[i] << ' '; } - HeaderFile << '\n'; - for (int i(0); i <= max_level; ++i) { HeaderFile << level_steps[i] << ' '; } - HeaderFile << '\n'; - for (int i(0); i <= max_level; ++i) { HeaderFile << level_count[i] << ' '; } - HeaderFile << '\n'; - } - - for (int i = 0; i <= finest_level; ++i) { - amr_level[i]->checkPoint(ckfileTemp, HeaderFile); - } - - if (ParallelDescriptor::IOProcessor()) { - const Vector<std::string> &FAHeaderNames = StateData::FabArrayHeaderNames(); - if(FAHeaderNames.size() > 0) { - std::string FAHeaderFilesName = ckfileTemp + "/FabArrayHeaders.txt"; - std::ofstream FAHeaderFile(FAHeaderFilesName.c_str(), - std::ios::out | std::ios::trunc | - std::ios::binary); - if ( ! FAHeaderFile.good()) { - amrex::FileOpenFailed(FAHeaderFilesName); - } - - for(int i(0); i < FAHeaderNames.size(); ++i) { - FAHeaderFile << FAHeaderNames[i] << '\n'; - } - } - } - - if(ParallelDescriptor::IOProcessor()) { - HeaderFile.precision(old_prec); - - if( ! HeaderFile.good()) { - amrex::Error("Amr::checkpoint() failed"); - } - } - - last_checkpoint = level_steps[0]; - - if (verbose > 0) - { - Real dCheckPointTime = ParallelDescriptor::second() - dCheckPointTime0; - - ParallelDescriptor::ReduceRealMax(dCheckPointTime, - ParallelDescriptor::IOProcessorNumber()); - - amrex::Print() << "checkPoint() time = " << dCheckPointTime << " secs." << '\n'; - } - ParallelDescriptor::Barrier("Amr::checkPoint::end"); - - if(ParallelDescriptor::IOProcessor()) { - std::rename(ckfileTemp.c_str(), ckfile.c_str()); - } - ParallelDescriptor::Barrier("Renaming temporary checkPoint file."); - - } // end while - - // - // Restore the previous FAB format. - // - FArrayBox::setFormat(thePrevFormat); - - VisMF::SetHeaderVersion(currentVersion); - - BL_PROFILE_REGION_STOP("Amr::checkPoint()"); -} - -void -Amr::RegridOnly (Real time) -{ - BL_ASSERT(regrid_on_restart == 1); - - int lev_top = std::min(finest_level, max_level-1); - - for (int i = 0; i <= lev_top; i++) - regrid(i,time); - - if (plotfile_on_restart) - writePlotFile(); - - if (checkpoint_on_restart) - checkPoint(); - -} - -void -Amr::timeStep (int level, - Real time, - int iteration, - int niter, - Real stop_time) -{ - BL_PROFILE("Amr::timeStep()"); - BL_COMM_PROFILE_NAMETAG("Amr::timeStep TOP"); - - // This is used so that the AmrLevel functions can know which level is being advanced - // when regridding is called with possible lbase > level. - which_level_being_advanced = level; - - // Update so that by default, we don't force a post-step regrid. - amr_level[level]->setPostStepRegrid(0); - - // - // Allow regridding of level 0 calculation on restart. - // - if (max_level == 0 && regrid_on_restart) - { - regrid_level_0_on_restart(); - } - else - { - int lev_top = std::min(finest_level, max_level-1); - - for (int i(level); i <= lev_top; ++i) - { - const int old_finest = finest_level; - - if (okToRegrid(i)) - { - regrid(i,time); - - // - // Compute new dt after regrid if at level 0 and compute_new_dt_on_regrid. 
- // - if ( compute_new_dt_on_regrid && (i == 0) ) - { - int post_regrid_flag = 1; - amr_level[0]->computeNewDt(finest_level, - sub_cycle, - n_cycle, - ref_ratio, - dt_min, - dt_level, - stop_time, - post_regrid_flag); - } - - for (int k(i); k <= finest_level; ++k) { - level_count[k] = 0; - } - - if (old_finest < finest_level) - { - // - // The new levels will not have valid time steps - // and iteration counts. - // - for (int k(old_finest + 1); k <= finest_level; ++k) - { - dt_level[k] = dt_level[k-1]/n_cycle[k]; - } - } - } - if (old_finest > finest_level) { - lev_top = std::min(finest_level, max_level - 1); - } - } - - if (max_level == 0 && loadbalance_level0_int > 0 && loadbalance_with_workestimates) - { - if (level_steps[0] == 1 || level_count[0] >= loadbalance_level0_int) { - LoadBalanceLevel0(time); - level_count[0] = 0; - } - } - } - // - // Check to see if should write plotfile. - // This routine is here so it is done after the restart regrid. - // - if (plotfile_on_restart && ! (restart_chkfile.empty()) ) - { - plotfile_on_restart = 0; - writePlotFile(); - } - // - // Advance grids at this level. - // - if (verbose > 0) - { - amrex::Print() << "[Level " << level << " step " << level_steps[level]+1 << "] " - << "ADVANCE with dt = " << dt_level[level] << "\n"; - } - BL_PROFILE_REGION_START("amr_level.advance"); - Real dt_new = amr_level[level]->advance(time,dt_level[level],iteration,niter); - BL_PROFILE_REGION_STOP("amr_level.advance"); - - dt_min[level] = iteration == 1 ? dt_new : std::min(dt_min[level],dt_new); - - level_steps[level]++; - level_count[level]++; - - if (verbose > 0) - { - amrex::Print() << "[Level " << level << " step " << level_steps[level] << "] " - << "Advanced " << amr_level[level]->countCells() << " cells\n"; - } - - // If the level signified that it wants a regrid after the advance has - // occurred, do that now. - if (amr_level[level]->postStepRegrid()) { - - int old_finest = finest_level; - - regrid(level, time); - - if (old_finest < finest_level) - { - // - // The new levels will not have valid time steps. - // - for (int k = old_finest + 1; k <= finest_level; ++k) - { - dt_level[k] = dt_level[k-1] / n_cycle[k]; - } - } - - } - - // - // Advance grids at higher level. - // - if (level < finest_level) - { - const int lev_fine = level+1; - - if (sub_cycle) - { - const int ncycle = n_cycle[lev_fine]; - - BL_COMM_PROFILE_NAMETAG("Amr::timeStep timeStep subcycle"); - for (int i = 1; i <= ncycle; i++) - timeStep(lev_fine,time+(i-1)*dt_level[lev_fine],i,ncycle,stop_time); - } - else - { - BL_COMM_PROFILE_NAMETAG("Amr::timeStep timeStep nosubcycle"); - timeStep(lev_fine,time,1,1,stop_time); - } - } - - amr_level[level]->post_timestep(iteration); - - // Set this back to negative so we know whether we are in fact in this routine - which_level_being_advanced = -1; -} - -Real -Amr::coarseTimeStepDt (Real stop_time) -{ - coarseTimeStep(stop_time); - return dt_level[0]; -} - -void -Amr::coarseTimeStep (Real stop_time) -{ - BL_PROFILE_REGION_START("Amr::coarseTimeStep()"); - BL_PROFILE("Amr::coarseTimeStep()"); - std::stringstream stepName; - stepName << "timeStep STEP " << level_steps[0]; - - const Real run_strt = ParallelDescriptor::second() ; - - // - // Compute new dt. 
- // - if (levelSteps(0) > 0) - { - int post_regrid_flag = 0; - amr_level[0]->computeNewDt(finest_level, - sub_cycle, - n_cycle, - ref_ratio, - dt_min, - dt_level, - stop_time, - post_regrid_flag); - } - else - { - amr_level[0]->computeInitialDt(finest_level, - sub_cycle, - n_cycle, - ref_ratio, - dt_level, - stop_time); - } - - BL_PROFILE_REGION_START(stepName.str()); - - timeStep(0,cumtime,1,1,stop_time); - - BL_PROFILE_REGION_STOP(stepName.str()); - - cumtime += dt_level[0]; - - amr_level[0]->postCoarseTimeStep(cumtime); - - if (verbose > 0) - { - const int IOProc = ParallelDescriptor::IOProcessorNumber(); - Real run_stop = ParallelDescriptor::second() - run_strt; - const int istep = level_steps[0]; - -#ifdef BL_LAZY - Lazy::QueueReduction( [=] () mutable { -#endif - ParallelDescriptor::ReduceRealMax(run_stop,IOProc); - amrex::Print() << "\n[STEP " << istep << "] Coarse TimeStep time: " << run_stop << '\n'; -#ifdef BL_LAZY - }); -#endif - -#ifndef AMREX_MEM_PROFILING - long min_fab_kilobytes = amrex::TotalBytesAllocatedInFabsHWM()/1024; - long max_fab_kilobytes = min_fab_kilobytes; - -#ifdef BL_LAZY - Lazy::QueueReduction( [=] () mutable { -#endif - ParallelDescriptor::ReduceLongMin(min_fab_kilobytes, IOProc); - ParallelDescriptor::ReduceLongMax(max_fab_kilobytes, IOProc); - - amrex::Print() << "[STEP " << istep << "] FAB kilobyte spread across MPI nodes: [" - << min_fab_kilobytes << " ... " << max_fab_kilobytes << "]\n"; -#ifdef BL_LAZY - amrex::Print() << "\n"; - }); -#endif -#endif - } - -#ifdef AMREX_MEM_PROFILING - { - std::ostringstream ss; - ss << "[STEP " << level_steps[0] << "]"; - MemProfiler::report(ss.str()); - } -#endif - - BL_PROFILE_ADD_STEP(level_steps[0]); - BL_PROFILE_REGION_STOP("Amr::coarseTimeStep()"); - BL_TRACE_PROFILE_FLUSH(); - BL_COMM_PROFILE_NAMETAG(stepName.str()); - BL_COMM_PROFILE_FLUSH(); - - if (verbose > 0) - { - amrex::Print() - << "\nSTEP = " << level_steps[0] - << " TIME = " << cumtime - << " DT = " << dt_level[0] << "\n\n"; - } - if (record_run_info && ParallelDescriptor::IOProcessor()) - { - runlog << "STEP = " << level_steps[0] - << " TIME = " << cumtime - << " DT = " << dt_level[0] << '\n'; - } - if (record_run_info_terse && ParallelDescriptor::IOProcessor()) - runlog_terse << level_steps[0] << " " << cumtime << " " << dt_level[0] << '\n'; - - int check_test = 0; - - if (check_per > 0.0) - { - const int num_per_old = (cumtime-dt_level[0]) / check_per; - const int num_per_new = (cumtime ) / check_per; - - if (num_per_old != num_per_new) - { - check_test = 1; - } - } - - int to_stop = 0; - int to_checkpoint = 0; - int to_plot = 0; - int to_small_plot = 0; - if (message_int > 0 && level_steps[0] % message_int == 0) { - if (ParallelDescriptor::IOProcessor()) - { - FILE *fp; - if ((fp=fopen("dump_and_continue","r")) != 0) - { - remove("dump_and_continue"); - to_checkpoint = 1; - fclose(fp); - } - else if ((fp=fopen("stop_run","r")) != 0) - { - remove("stop_run"); - to_stop = 1; - fclose(fp); - } - else if ((fp=fopen("dump_and_stop","r")) != 0) - { - remove("dump_and_stop"); - to_checkpoint = 1; - to_stop = 1; - fclose(fp); - } - - if ((fp=fopen("plot_and_continue","r")) != 0) - { - remove("plot_and_continue"); - to_plot = 1; - fclose(fp); - } - - if ((fp=fopen("small_plot_and_continue","r")) != 0) - { - remove("small_plot_and_continue"); - to_small_plot = 1; - fclose(fp); - } - } - int packed_data[4]; - packed_data[0] = to_stop; - packed_data[1] = to_checkpoint; - packed_data[2] = to_plot; - packed_data[3] = to_small_plot; - 
ParallelDescriptor::Bcast(packed_data, 4, ParallelDescriptor::IOProcessorNumber()); - to_stop = packed_data[0]; - to_checkpoint = packed_data[1]; - to_plot = packed_data[2]; - to_small_plot = packed_data[3]; - - } - - if(to_stop == 1 && to_checkpoint == 0) { // prevent main from writing files - last_checkpoint = level_steps[0]; - last_plotfile = level_steps[0]; - } - - if (to_checkpoint && write_plotfile_with_checkpoint) - to_plot = 1; - - if ((check_int > 0 && level_steps[0] % check_int == 0) || check_test == 1 - || to_checkpoint) - { - checkPoint(); - } - - - if (writePlotNow() || to_plot) - { - writePlotFile(); - } - - if (writeSmallPlotNow() || to_small_plot) - { - writeSmallPlotFile(); - } - - bUserStopRequest = to_stop; - if (to_stop) - { - ParallelDescriptor::Barrier("Amr::coarseTimeStep::to_stop"); - if(ParallelDescriptor::IOProcessor()) { - if (to_checkpoint) - { - std::cerr << "Stopped by user w/ checkpoint" << std::endl; - } - else - { - std::cerr << "Stopped by user w/o checkpoint" << std::endl; - } - } - } -} - -bool -Amr::writePlotNow() -{ - int plot_test = 0; - if (plot_per > 0.0) - { - const int num_per_old = (cumtime-dt_level[0]) / plot_per; - const int num_per_new = (cumtime ) / plot_per; - - if (num_per_old != num_per_new) - { - plot_test = 1; - } - } - - return ( (plot_int > 0 && level_steps[0] % plot_int == 0) || - plot_test == 1 || - amr_level[0]->writePlotNow()); -} - -bool -Amr::writeSmallPlotNow() -{ - int plot_test = 0; - if (small_plot_per > 0.0) - { - const int num_per_old = (cumtime-dt_level[0]) / small_plot_per; - const int num_per_new = (cumtime ) / small_plot_per; - - if (num_per_old != num_per_new) - { - plot_test = 1; - } - } - - return ( (small_plot_int > 0 && level_steps[0] % small_plot_int == 0) || - plot_test == 1 || - amr_level[0]->writeSmallPlotNow()); -}
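The *_per tests above (and check_per in coarseTimeStep()) implement interval-based triggering: the truncating Real-to-int conversion acts as a floor, and output fires whenever the step just taken crosses an interval boundary. A worked example, assuming plot_per = 0.5 and dt_level[0] = 0.2: advancing cumtime from 0.4 to 0.6 gives num_per_old = int(0.4/0.5) = 0 and num_per_new = int(0.6/0.5) = 1, so a plotfile is written; advancing from 0.6 to 0.8 gives 1 and 1, so none is.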
- -void -Amr::defBaseLevel (Real strt_time, - const BoxArray* lev0_grids, - const Vector<int>* pmap) -{ - BL_PROFILE("Amr::defBaseLevel()"); - // Just initialize this here for the heck of it - which_level_being_advanced = -1; - - // - // Check that base domain has even number of zones in all directions. - // - const Box& domain = Geom(0).Domain(); - const IntVect& d_len = domain.size(); - - for (int idir = 0; idir < BL_SPACEDIM; idir++) - if (d_len[idir]%2 != 0) - amrex::Error("defBaseLevel: must have even number of cells"); - - BoxArray lev0; - - if (lev0_grids != 0 && lev0_grids->size() > 0) - { - BL_ASSERT(pmap != 0); - - BoxArray domain_ba(domain); - if (!domain_ba.contains(*lev0_grids)) - amrex::Error("defBaseLevel: domain does not contain lev0_grids!"); - if (!lev0_grids->contains(domain_ba)) - amrex::Error("defBaseLevel: lev0_grids does not contain domain"); - - lev0 = *lev0_grids; - - if (refine_grid_layout) { - ChopGrids(0,lev0,ParallelDescriptor::NProcs()); - } - } - else - { - lev0 = MakeBaseGrids(); - } - - this->SetBoxArray(0, lev0); - this->SetDistributionMap(0, DistributionMapping(lev0)); - - // - // Now build level 0 grids. - // - amr_level[0].reset((*levelbld)(*this,0,Geom(0),grids[0],dmap[0],strt_time)); - // - // Now init level 0 grids with data. - // - amr_level[0]->initData(); -} - -void -Amr::regrid (int lbase, - Real time, - bool initial) -{ - BL_PROFILE("Amr::regrid()"); - - if (lbase > std::min(finest_level,max_level-1)) return; - - if (verbose > 0) - amrex::Print() << "Now regridding at level lbase = " << lbase << "\n"; - - // - // Compute positions of new grids. 
- // - int new_finest; - Vector<BoxArray> new_grid_places(max_level+1); - Vector<DistributionMapping> new_dmap(max_level+1); - - grid_places(lbase,time,new_finest, new_grid_places); - - bool regrid_level_zero = (!initial) && (lbase == 0) - && ( loadbalance_with_workestimates || (new_grid_places[0] != amr_level[0]->boxArray())); - - const int start = regrid_level_zero ? 0 : lbase+1; - - bool grids_unchanged = finest_level == new_finest; - for (int lev = start, End = std::min(finest_level,new_finest); lev <= End; lev++) { - if (new_grid_places[lev] == amr_level[lev]->boxArray()) { - new_grid_places[lev] = amr_level[lev]->boxArray(); // to avoid duplicates - new_dmap[lev] = amr_level[lev]->DistributionMap(); - } else { - grids_unchanged = false; - } - } - - // - // If use_efficient_regrid flag is set and grids are unchanged, then don't do anything more here. - // - if (use_efficient_regrid == 1 && grids_unchanged ) - { - if (verbose > 0) { - amrex::Print() << "Regridding at level lbase = " << lbase - << " but grids unchanged\n"; - } - return; - } - - // - // Reclaim old-time grid space for all remain levels > lbase. - // - for(int lev = start; lev <= finest_level; ++lev) { - amr_level[lev]->removeOldData(); - } - // - // Reclaim all remaining storage for levels > new_finest. - // - for(int lev = new_finest + 1; lev <= finest_level; ++lev) { - amr_level[lev].reset(); - this->ClearBoxArray(lev); - this->ClearDistributionMap(lev); - } - - finest_level = new_finest; - - // - // Define the new grids from level start up to new_finest. - // - for(int lev = start; lev <= new_finest; ++lev) { - // - // Construct skeleton of new level. - // - - if (loadbalance_with_workestimates && !initial) { - new_dmap[lev] = makeLoadBalanceDistributionMap(lev, time, new_grid_places[lev]); - } - else if (new_dmap[lev].empty()) { - new_dmap[lev].define(new_grid_places[lev]); - } - - AmrLevel* a = (*levelbld)(*this,lev,Geom(lev),new_grid_places[lev], - new_dmap[lev],cumtime); - - if (initial) - { - // - // We're being called on startup from bldFineLevels(). - // NOTE: The initData function may use a filPatch, and so needs to - // be officially inserted into the hierarchy prior to the call. - // - amr_level[lev].reset(a); - this->SetBoxArray(lev, amr_level[lev]->boxArray()); - this->SetDistributionMap(lev, amr_level[lev]->DistributionMap()); - amr_level[lev]->initData(); - } - else if (amr_level[lev]) - { - // - // Init with data from old structure then remove old structure. - // NOTE: The init function may use a filPatch from the old level, - // which therefore needs remain in the hierarchy during the call. - // - a->init(*amr_level[lev]); - amr_level[lev].reset(a); - this->SetBoxArray(lev, amr_level[lev]->boxArray()); - this->SetDistributionMap(lev, amr_level[lev]->DistributionMap()); - } - else - { - a->init(); - amr_level[lev].reset(a); - this->SetBoxArray(lev, amr_level[lev]->boxArray()); - this->SetDistributionMap(lev, amr_level[lev]->DistributionMap()); - } - - } - - - // - // Check at *all* levels whether we need to do anything special now that the grids - // at levels lbase+1 and higher may have changed. - // - for(int lev(0); lev <= new_finest; ++lev) { - amr_level[lev]->post_regrid(lbase,new_finest); - } - - // - // Report creation of new grids. 
- // - - if (record_run_info && ParallelDescriptor::IOProcessor()) - { - runlog << "REGRID: at level lbase = " << lbase << '\n'; - printGridInfo(runlog,start,finest_level); - } - - if (record_grid_info && ParallelDescriptor::IOProcessor()) - { - if (lbase == 0) - gridlog << "STEP = " << level_steps[0] << ' '; - - gridlog << "TIME = " - << time - << " : REGRID with lbase = " - << lbase - << '\n'; - - printGridInfo(gridlog,start,finest_level); - } - - if (verbose > 0 && ParallelDescriptor::IOProcessor()) - { - if (lbase == 0) - std::cout << "STEP = " << level_steps[0] << ' '; - - std::cout << "TIME = " - << time - << " : REGRID with lbase = " - << lbase - << std::endl; - - if (verbose > 1) - { - printGridInfo(std::cout,start,finest_level); - } - else - { - printGridSummary(std::cout,start,finest_level); - } - } -} - -DistributionMapping -Amr::makeLoadBalanceDistributionMap (int lev, Real time, const BoxArray& ba) const -{ - BL_PROFILE("makeLoadBalanceDistributionMap()"); - - amrex::Print() << "Load balance on level " << lev << " at t = " << time << "\n"; - - DistributionMapping newdm; - - const int work_est_type = amr_level[0]->WorkEstType(); - - if (work_est_type < 0) { - amrex::Print() << "\nAMREX WARNING: work estimates type does not exist!\n\n"; - newdm.define(ba); - } - else if (amr_level[lev]) - { - DistributionMapping dmtmp; - if (ba.size() == boxArray(lev).size()) { - dmtmp = DistributionMap(lev); - } else { - dmtmp.define(ba); - } - - MultiFab workest(ba, dmtmp, 1, 0); - AmrLevel::FillPatch(*amr_level[lev], workest, 0, time, work_est_type, 0, 1, 0); - - Real navg = static_cast<Real>(ba.size()) / static_cast<Real>(ParallelDescriptor::NProcs()); - int nmax = std::max(std::round(loadbalance_max_fac*navg), std::ceil(navg)); - - newdm = DistributionMapping::makeKnapSack(workest, nmax); - } - else - { - newdm.define(ba); - } - - return newdm; -}
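makeLoadBalanceDistributionMap() above hands the per-box work estimates to DistributionMapping::makeKnapSack. The sketch below is not the AMReX implementation, only the greedy bin-packing idea behind this kind of balancer, assuming weights[i] is the estimated work of box i:

#include <algorithm>
#include <functional>
#include <numeric>
#include <queue>
#include <utility>
#include <vector>

// Greedy knapsack-style assignment: the heaviest remaining box always
// goes to the currently least-loaded rank. Returns the rank per box.
std::vector<int> greedy_knapsack (const std::vector<double>& weights, int nranks)
{
    std::vector<int> order(weights.size());
    std::iota(order.begin(), order.end(), 0);
    std::sort(order.begin(), order.end(),
              [&] (int a, int b) { return weights[a] > weights[b]; });

    using Load = std::pair<double,int>;              // (accumulated work, rank)
    std::priority_queue<Load, std::vector<Load>, std::greater<Load>> ranks;
    for (int r = 0; r < nranks; ++r) ranks.emplace(0.0, r);

    std::vector<int> dmap(weights.size());
    for (int i : order) {
        auto [load, r] = ranks.top(); ranks.pop();   // lightest rank so far
        dmap[i] = r;
        ranks.emplace(load + weights[i], r);
    }
    return dmap;
}

AMReX additionally caps the number of boxes per rank; that is the role of the nmax argument computed from loadbalance_max_fac above.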
- -void -Amr::LoadBalanceLevel0 (Real time) -{ - BL_PROFILE("LoadBalanceLevel0()"); - const auto& dm = makeLoadBalanceDistributionMap(0, time, boxArray(0)); - InstallNewDistributionMap(0, dm); - amr_level[0]->post_regrid(0,time); -} - -void -Amr::InstallNewDistributionMap (int lev, const DistributionMapping& newdm) -{ - BL_PROFILE("InstallNewDistributionMap()"); - - AmrLevel* a = (*levelbld)(*this,lev,Geom(lev),boxArray(lev),newdm,cumtime); - a->init(*amr_level[lev]); - amr_level[lev].reset(a); - - this->SetBoxArray(lev, amr_level[lev]->boxArray()); - this->SetDistributionMap(lev, amr_level[lev]->DistributionMap()); -} - -void -Amr::regrid_level_0_on_restart() -{ - regrid_on_restart = 0; - // - // Coarsening before we split the grids ensures that each resulting - // grid will have an even number of cells in each direction. - // - BoxArray lev0(amrex::coarsen(Geom(0).Domain(),2)); - // - // Now split up into list of grids within max_grid_size[0] limit. - // - lev0.maxSize(max_grid_size[0]/2); - // - // Now refine these boxes back to level 0. - // - lev0.refine(2); - - // - // If use_efficient_regrid flag is set, then test to see whether we in fact - // have just changed the level 0 grids. If not, then don't do anything more here. - // - if ( !( (use_efficient_regrid == 1) && (lev0 == amr_level[0]->boxArray()) ) ) - { - // - // Construct skeleton of new level. 
- // - DistributionMapping dm(lev0); - AmrLevel* a = (*levelbld)(*this,0,Geom(0),lev0,dm,cumtime); - - a->init(*amr_level[0]); - amr_level[0].reset(a); - - this->SetBoxArray(0, amr_level[0]->boxArray()); - this->SetDistributionMap(0, amr_level[0]->DistributionMap()); - - amr_level[0]->post_regrid(0,0); - - if (ParallelDescriptor::IOProcessor()) - { - if (verbose > 1) - { - printGridInfo(std::cout,0,finest_level); - } - else if (verbose > 0) - { - printGridSummary(std::cout,0,finest_level); - } - } - - if (record_grid_info && ParallelDescriptor::IOProcessor()) - printGridInfo(gridlog,0,finest_level); - } - else - { - if (verbose > 0) - amrex::Print() << "Regridding at level 0 but grids unchanged \n"; - } -} - -void -Amr::printGridInfo (std::ostream& os, - int min_lev, - int max_lev) -{ - for (int lev = min_lev; lev <= max_lev; lev++) - { - const BoxArray& bs = amr_level[lev]->boxArray(); - int numgrid = bs.size(); - long ncells = amr_level[lev]->countCells(); - double ntot = Geom(lev).Domain().d_numPts(); - Real frac = 100.0_rt*(Real(ncells) / ntot); - const DistributionMapping& map = amr_level[lev]->get_new_data(0).DistributionMap(); - - os << " Level " - << lev - << " " - << numgrid - << " grids " - << ncells - << " cells " - << frac - << " % of domain" - << '\n'; - - - for (int k = 0; k < numgrid; k++) - { - const Box& b = bs[k]; - - os << ' ' << lev << ": " << b << " "; - - for (int i = 0; i < BL_SPACEDIM; i++) - os << b.length(i) << ' '; - - os << ":: " << map[k] << '\n'; - } - } - - os << std::endl; // Make sure we flush! -} - - -void -Amr::grid_places (int lbase, - Real time, - int& new_finest, - Vector<BoxArray>& new_grids) -{ - BL_PROFILE("Amr::grid_places()"); - - const Real strttime = ParallelDescriptor::second(); - - if (lbase == 0) - { - new_grids[0] = MakeBaseGrids(); - } - - if ( time == 0. && !initial_grids_file.empty() && !use_fixed_coarse_grids) - { - new_finest = std::min(max_level,(finest_level+1)); - new_finest = std::min(new_finest,initial_ba.size()); - - for (int lev = 1; lev <= new_finest; lev++) - { - BoxList bl; - int ngrid = initial_ba[lev-1].size(); - for (int i = 0; i < ngrid; i++) - { - Box bx(initial_ba[lev-1][i]); - if (lev > lbase) - bl.push_back(bx); - } - if (lev > lbase) - new_grids[lev].define(bl); - } - return; - } - - // Use grids in initial_grids_file as fixed coarse grids. - if ( ! 
initial_grids_file.empty() && use_fixed_coarse_grids) - { - new_finest = std::min(max_level,(finest_level+1)); - new_finest = std::min(new_finest,initial_ba.size()); - - for (int lev = lbase+1; lev <= new_finest; lev++) - { - BoxList bl; - int ngrid = initial_ba[lev-1].size(); - for (int i = 0; i < ngrid; i++) - { - Box bx(initial_ba[lev-1][i]); - - if (lev > lbase) - bl.push_back(bx); - - } - if (lev > lbase) - new_grids[lev].define(bl); - new_grids[lev].maxSize(max_grid_size[lev]); - } - } - else if ( !regrid_grids_file.empty() ) // Use grids in regrid_grids_file - { - new_finest = std::min(max_level,(finest_level+1)); - new_finest = std::min(new_finest,regrid_ba.size()); - for (int lev = 1; lev <= new_finest; lev++) - { - BoxList bl; - int ngrid = regrid_ba[lev-1].size(); - for (int i = 0; i < ngrid; i++) - { - Box bx(regrid_ba[lev-1][i]); - if (lev > lbase) - bl.push_back(bx); - } - if (lev > lbase) - new_grids[lev].define(bl); - } - return; - } - - MakeNewGrids(lbase, time, new_finest, new_grids); - - if (verbose > 0) - { - Real stoptime = ParallelDescriptor::second() - strttime; - -#ifdef BL_LAZY - Lazy::QueueReduction( [=] () mutable { -#endif - ParallelDescriptor::ReduceRealMax(stoptime,ParallelDescriptor::IOProcessorNumber()); - amrex::Print() << "grid_places() time: " << stoptime << " new finest: " << new_finest<< '\n'; -#ifdef BL_LAZY - }); -#endif - } -} - -void -Amr::ErrorEst (int lev, TagBoxArray& tags, Real time, int ngrow) -{ - amr_level[lev]->errorEst(tags,TagBox::CLEAR,TagBox::SET,time, n_error_buf[lev],ngrow); -} - -BoxArray -Amr::GetAreaNotToTag (int lev) -{ - return BoxArray(amr_level[lev]->getAreaNotToTag()); -} - -void -Amr::ManualTagsPlacement (int lev, TagBoxArray& tags, const Vector<IntVect>& bf_lev) -{ - amr_level[lev]->manual_tags_placement(tags, bf_lev); -} - -void -Amr::bldFineLevels (Real strt_time) -{ - BL_PROFILE("Amr::bldFineLevels()"); - finest_level = 0; - - Vector<BoxArray> new_grids(max_level+1); - // - // Get initial grid placement. - // - do - { - int new_finest; - - grid_places(finest_level,strt_time,new_finest,new_grids); - - if (new_finest <= finest_level) break; - // - // Create a new level and link with others. - // - finest_level = new_finest; - - DistributionMapping new_dm {new_grids[new_finest]}; - - AmrLevel* level = (*levelbld)(*this, - new_finest, - Geom(new_finest), - new_grids[new_finest], - new_dm, - strt_time); - - amr_level[new_finest].reset(level); - this->SetBoxArray(new_finest, new_grids[new_finest]); - this->SetDistributionMap(new_finest, new_dm); - - amr_level[new_finest]->initData(); - } - while (finest_level < max_level); - // - // Iterate grids to ensure fine grids encompass all interesting gunk. - // but only iterate if we did not provide a grids file. - // - if ( regrid_grids_file.empty() || (strt_time == 0.0 && !initial_grids_file.empty()) ) - { - bool grids_the_same; - - const int MaxCnt = 4; - - int count = 0; - - do - { - for (int i = 0; i <= finest_level; i++) { - new_grids[i] = amr_level[i]->boxArray(); - } - - regrid(0,strt_time,true); - - grids_the_same = true; - - for (int i = 0; i <= finest_level && grids_the_same; i++) { - if (!(new_grids[i] == amr_level[i]->boxArray())) { - grids_the_same = false; - } - } - - count++; - } - while (!grids_the_same && count < MaxCnt); - } -} - -void -Amr::initSubcycle () -{ - BL_PROFILE("Amr::initSubcycle()"); - ParmParse pp("amr"); - sub_cycle = true; - if (pp.contains("nosub")) - { - amrex::Print() << "Warning: The nosub flag has been deprecated.\n " - << "... 
please use subcycling_mode to control subcycling.\n"; - int nosub; - pp.query("nosub",nosub); - if (nosub > 0) - sub_cycle = false; - else - amrex::Error("nosub <= 0 not allowed.\n"); - subcycling_mode = "None"; - } - else - { - subcycling_mode = "Auto"; - pp.query("subcycling_mode",subcycling_mode); - } - - if (subcycling_mode == "None") - { - sub_cycle = false; - for (int i = 0; i <= max_level; i++) - { - n_cycle[i] = 1; - } - } - else if (subcycling_mode == "Manual") - { - int cnt = pp.countval("subcycling_iterations"); - - if (cnt == 1) - { - // - // Set all values to the single available value. - // - int cycles = 0; - - pp.get("subcycling_iterations",cycles); - - n_cycle[0] = 1; // coarse level is always 1 cycle - for (int i = 1; i <= max_level; i++) - { - n_cycle[i] = cycles; - } - } - else if (cnt > 1) - { - // - // Otherwise we expect a vector of max_level+1 values. - // - pp.getarr("subcycling_iterations",n_cycle,0,max_level+1); - if (n_cycle[0] != 1) - { - amrex::Error("First entry of subcycling_iterations must be 1"); - } - } - else - { - amrex::Error("Must provide a valid subcycling_iterations if mode is Manual"); - } - for (int i = 1; i <= max_level; i++) - { - if (n_cycle[i] > MaxRefRatio(i-1)) - amrex::Error("subcycling iterations must always be <= ref_ratio"); - if (n_cycle[i] <= 0) - amrex::Error("subcycling iterations must always be > 0"); - } - } - else if (subcycling_mode == "Auto") - { - n_cycle[0] = 1; - for (int i = 1; i <= max_level; i++) - { - n_cycle[i] = MaxRefRatio(i-1); - } - } - else if (subcycling_mode == "Optimal") - { - // if subcycling mode is Optimal, n_cycle is set dynamically. - // We'll initialize it to be Auto subcycling. - n_cycle[0] = 1; - for (int i = 1; i <= max_level; i++) - { - n_cycle[i] = MaxRefRatio(i-1); - } - } - else - { - std::string err_message = "Unrecognized subcycling mode: " + subcycling_mode + "\n"; - amrex::Error(err_message.c_str()); - } -}
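For reference, the modes parsed by initSubcycle() above correspond to inputs like the following hypothetical fragment (standard ParmParse syntax; the values are illustrative only):

amr.subcycling_mode       = Manual
amr.subcycling_iterations = 1 2 2   # level 0 must be 1; level i must be <= ref_ratio at i-1

With subcycling_mode = Auto, n_cycle[i] is instead set to MaxRefRatio(i-1); Optimal starts from the Auto values and retunes them dynamically (see computeOptimalSubcycling() below).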
- -void -Amr::initPltAndChk () -{ - ParmParse pp("amr"); - - pp.query("checkpoint_files_output", checkpoint_files_output); - pp.query("plot_files_output", plot_files_output); - - pp.query("plot_nfiles", plot_nfiles); - pp.query("checkpoint_nfiles", checkpoint_nfiles); - // - // -1 ==> use ParallelDescriptor::NProcs(). 
- // - if (plot_nfiles == -1) plot_nfiles = ParallelDescriptor::NProcs(); - if (checkpoint_nfiles == -1) checkpoint_nfiles = ParallelDescriptor::NProcs(); - - check_file_root = "chk"; - pp.query("check_file",check_file_root); - - check_int = -1; - pp.query("check_int",check_int); - - check_per = -1.0; - pp.query("check_per",check_per); - - if (check_int > 0 && check_per > 0) - { - if (ParallelDescriptor::IOProcessor()) - amrex::Warning("Warning: both amr.check_int and amr.check_per are > 0."); - } - - plot_file_root = "plt"; - pp.query("plot_file",plot_file_root); - - plot_int = -1; - pp.query("plot_int",plot_int); - - plot_per = -1.0; - pp.query("plot_per",plot_per); - - if (plot_int > 0 && plot_per > 0) - { - if (ParallelDescriptor::IOProcessor()) - amrex::Warning("Warning: both amr.plot_int and amr.plot_per are > 0."); - } - - small_plot_file_root = "smallplt"; - pp.query("small_plot_file",small_plot_file_root); - - small_plot_int = -1; - pp.query("small_plot_int",small_plot_int); - - small_plot_per = -1.0; - pp.query("small_plot_per",small_plot_per); - - if (small_plot_int > 0 && small_plot_per > 0) - { - if (ParallelDescriptor::IOProcessor()) - amrex::Warning("Warning: both amr.small_plot_int and amr.small_plot_per are > 0."); - } - - write_plotfile_with_checkpoint = 1; - pp.query("write_plotfile_with_checkpoint",write_plotfile_with_checkpoint); - - stream_max_tries = 4; - pp.query("stream_max_tries",stream_max_tries); - stream_max_tries = std::max(stream_max_tries, 1); - - abort_on_stream_retry_failure = false; - pp.query("abort_on_stream_retry_failure",abort_on_stream_retry_failure); - - pp.query("precreateDirectories", precreateDirectories); - pp.query("prereadFAHeaders", prereadFAHeaders); - - int phvInt(plot_headerversion), chvInt(checkpoint_headerversion); - pp.query("plot_headerversion", phvInt); - if(phvInt != plot_headerversion) { - plot_headerversion = static_cast<VisMF::Header::Version> (phvInt); - } - pp.query("checkpoint_headerversion", chvInt); - if(chvInt != checkpoint_headerversion) { - checkpoint_headerversion = static_cast<VisMF::Header::Version> (chvInt); - } -} - - -bool -Amr::okToRegrid(int level) -{ - if (regrid_int[level] < 0) - return false; - else - return level_count[level] >= regrid_int[level] && amr_level[level]->okToRegrid(); -} - -Real -Amr::computeOptimalSubcycling(int n, int* best, Real* dt_max, Real* est_work, int* cycle_max) -{ - BL_ASSERT(cycle_max[0] == 1); - // internally these represent the total number of steps at a level, - // not the number of cycles - std::vector<int> cycles(n); - Real best_ratio = 1e200; - Real best_dt = 0; - Real ratio; - Real dt; - Real work; - int limit = 1; - // This provides a memory efficient way to test all candidates - for (int i = 1; i < n; i++) - limit *= cycle_max[i]; - for (int candidate = 0; candidate < limit; candidate++) - { - int temp_cand = candidate; - cycles[0] = 1; - dt = dt_max[0]; - work = est_work[0]; - for (int i = 1; i < n; i++) - { - // grab the relevant "digit" and shift over. 
- cycles[i] = (1 + temp_cand%cycle_max[i]) * cycles[i-1]; - temp_cand /= cycle_max[i]; - dt = std::min(dt, cycles[i]*dt_max[i]); - work += cycles[i]*est_work[i]; - } - ratio = work/dt; - if (ratio < best_ratio) - { - for (int i = 0; i < n; i++) - best[i] = cycles[i]; - best_ratio = ratio; - best_dt = dt; - } - } - // - // Now we convert best back to n_cycles format - // - for (int i = n-1; i > 0; i--) - best[i] /= best[i-1]; - return best_dt; -} - -const Vector<BoxArray>& Amr::getInitialBA() -{ - return initial_ba; -} - -#ifdef AMREX_PARTICLES -void -Amr::RedistributeParticles () -{ - amr_level[0]->particle_redistribute(0,true); -} -#endif - -} -
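computeOptimalSubcycling() above enumerates every admissible subcycling pattern by treating the candidate index as a mixed-radix number with one "digit" per level; cycles[i] accumulates the total number of level-i steps per coarse step. A self-contained sketch of just that decoding step:

#include <cstddef>
#include <vector>

// Decode candidate k into per-level total step counts, where level i may
// take 1..cycle_max[i] substeps per step of level i-1.
std::vector<int> decode_candidate (int k, const std::vector<int>& cycle_max)
{
    std::vector<int> cycles(cycle_max.size());
    cycles[0] = 1;                                        // level 0: one step
    for (std::size_t i = 1; i < cycle_max.size(); ++i) {
        cycles[i] = (1 + k % cycle_max[i]) * cycles[i-1]; // grab a digit
        k /= cycle_max[i];                                // shift over
    }
    return cycles;
}

With cycle_max = {1,2,2}, limit is 4 and the candidates decode to the total-step patterns (1,1,1), (1,2,2), (1,1,2) and (1,2,4); the loop above then keeps whichever pattern minimizes estimated work per unit of advanced time.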
diff --git a/Src/AmrTask/Amr/Make.package b/Src/AmrTask/Amr/Make.package deleted file mode 100644 index 38448c44473..00000000000 --- a/Src/AmrTask/Amr/Make.package +++ /dev/null @@ -1,9 +0,0 @@ -AMRLIB_BASE=EXE - -C$(AMRLIB_BASE)_sources += AMReX_AmrAsync.cpp AMReX_AmrLevelAsync.cpp - -C$(AMRLIB_BASE)_headers += AMReX_Amr.H AMReX_AmrLevel.H AMReX_AmrLevelAsync.H AMReX_Derive.H AMReX_LevelBld.H AMReX_StateData.H \ - AMReX_StateDescriptor.H AMReX_PROB_AMR_F.H AMReX_AuxBoundaryData.H AMReX_Extrapolater.H - -VPATH_LOCATIONS += $(AMREX_HOME)/Src/Amr $(AMREX_HOME)/Src/AmrTask/Amr -INCLUDE_LOCATIONS += $(AMREX_HOME)/Src/Amr $(AMREX_HOME)/Src/AmrTask/Amr diff --git a/Src/AmrTask/Amr/Makefile b/Src/AmrTask/Amr/Makefile deleted file mode 100755 index 17c8d199fdb..00000000000 --- a/Src/AmrTask/Amr/Makefile +++ /dev/null @@ -1,23 +0,0 @@ -include ../arch.common - -OBJECTS= AMReX_AmrTask.o - -AMRLIB= AMRTask.a - -all: $(AMRLIB) - -$(AMRLIB): $(OBJECTS) - ar rv $(AMRLIB) $(OBJECTS) - - -INCLUDE += -DBL_USE_MPI -DBL_USE_OMP -DBL_SPACEDIM=3 -DAMREX_SPACEDIM=3 -DBL_FORT_USE_UNDERSCORE -DBL_Linux - -AMReX_AmrTask.o: AMReX_AmrTask.cpp - $(C++) $(C++FLAGS) -I./ -I../../Base -I../../Amr -I../../AmrCore -I../../Boundary -I../graph -I$(INCLUDE) -c AMReX_AmrTask.cpp -o AMReX_AmrTask.o - -.PHONY: clean - -clean: - $(RM) $(OBJECTS) - $(RM) *.a - diff --git a/Src/AmrTask/AmrCore/AMReX_FillPatchUtil.H b/Src/AmrTask/AmrCore/AMReX_FillPatchUtil.H deleted file mode 100644 index 767e668257a..00000000000 --- a/Src/AmrTask/AmrCore/AMReX_FillPatchUtil.H +++ /dev/null @@ -1,36 +0,0 @@ -#ifndef AMREX_FillPatchUtil_H_ -#define AMREX_FillPatchUtil_H_ - -#include -#include -#include -#include -#include - -namespace amrex -{ - void FillPatchSingleLevel (MultiFab& mf, Real time, - const Vector<MultiFab*>& smf, const Vector<Real>& stime, - int scomp, int dcomp, int ncomp, - const Geometry& geom, PhysBCFunctBase& physbcf); - - void FillPatchTwoLevels (MultiFab& mf, Real time, - const Vector<MultiFab*>& cmf, const Vector<Real>& ct, - const Vector<MultiFab*>& fmf, const Vector<Real>& ft, - int scomp, int dcomp, int ncomp, - const Geometry& cgeom, const Geometry& fgeom, - PhysBCFunctBase& cbc, PhysBCFunctBase& fbc, - const IntVect& ratio, - Interpolater* mapper, const BCRec& bcs); - - void FillPatchTwoLevels (MultiFab& mf, Real time, - const Vector<MultiFab*>& cmf, const Vector<Real>& ct, - const Vector<MultiFab*>& fmf, const Vector<Real>& ft, - int scomp, int dcomp, int ncomp, - const Geometry& cgeom, const Geometry& fgeom, - PhysBCFunctBase& cbc, PhysBCFunctBase& fbc, - const IntVect& ratio, - Interpolater* mapper, const Vector<BCRec>& bcs); -} - -#endif diff --git a/Src/AmrTask/AmrCore/AMReX_FillPatchUtil.cpp b/Src/AmrTask/AmrCore/AMReX_FillPatchUtil.cpp deleted file mode 100644 index 39d3fb74b4c..00000000000 --- a/Src/AmrTask/AmrCore/AMReX_FillPatchUtil.cpp +++ /dev/null @@ -1,176 +0,0 @@ -#include -#include -#include -#include - -#ifdef AMREX_USE_EB -#include -#endif - -#ifdef _OPENMP 
-#include <omp.h> -#endif - -namespace amrex -{ - void FillPatchSingleLevel (MultiFab& mf, Real time, - const Vector<MultiFab*>& smf, const Vector<Real>& stime, - int scomp, int dcomp, int ncomp, - const Geometry& geom, PhysBCFunctBase& physbcf) - { - BL_PROFILE("FillPatchSingleLevel"); - - BL_ASSERT(scomp+ncomp <= smf[0]->nComp()); - BL_ASSERT(dcomp+ncomp <= mf.nComp()); - BL_ASSERT(smf.size() == stime.size()); - BL_ASSERT(smf.size() != 0); - - if (smf.size() == 1) - { - mf.copy(*smf[0], scomp, dcomp, ncomp, 0, mf.nGrow(), geom.periodicity()); - } - else if (smf.size() == 2) - { - BL_ASSERT(smf[0]->boxArray() == smf[1]->boxArray()); - MultiFab raii; - MultiFab * dmf; - int destcomp; - bool sameba; - if (mf.boxArray() == smf[0]->boxArray()) { - dmf = &mf; - destcomp = dcomp; - sameba = true; - } else { - raii.define(smf[0]->boxArray(), smf[0]->DistributionMap(), ncomp, 0, - MFInfo(), smf[0]->Factory()); - - dmf = &raii; - destcomp = 0; - sameba = false; - } - -#ifdef _OPENMP -#pragma omp parallel -#endif - for (MFIter mfi(*dmf,true); mfi.isValid(); ++mfi) - { - const Box& bx = mfi.tilebox(); - (*dmf)[mfi].linInterp((*smf[0])[mfi], - scomp, - (*smf[1])[mfi], - scomp, - stime[0], - stime[1], - time, - bx, - destcomp, - ncomp); - } - - if (sameba) - { - // Note that when sameba is true mf's BoxArray is nonoverlapping. - // So FillBoundary is safe. - mf.FillBoundary(dcomp,ncomp,geom.periodicity()); - } - else - { - int src_ngrow = 0; - int dst_ngrow = mf.nGrow(); - - mf.copy(*dmf, 0, dcomp, ncomp, src_ngrow, dst_ngrow, geom.periodicity()); - } - } - else { - amrex::Abort("FillPatchSingleLevel: high-order interpolation in time not implemented yet"); - } - - physbcf.FillBoundary(mf, dcomp, ncomp, time); - }
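FillPatchSingleLevel() above blends the two source states with FArrayBox::linInterp, i.e. plain linear interpolation in time between stime[0] and stime[1]. Conceptually (a sketch, not the actual fab kernel):

// Linear-in-time blend, per cell: t0 <= t <= t1.
inline double lin_interp (double phi0, double phi1,
                          double t0, double t1, double t)
{
    double w1 = (t - t0) / (t1 - t0);      // weight of the newer state
    return (1.0 - w1) * phi0 + w1 * phi1;  // w0 = (t1 - t)/(t1 - t0)
}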
fpc.ba_crse_patch.empty()) - { - MultiFab mf_crse_patch(fpc.ba_crse_patch, fpc.dm_crse_patch, ncomp, 0, MFInfo(), - *fpc.fact_crse_patch); - - FillPatchSingleLevel(mf_crse_patch, time, cmf, ct, scomp, 0, ncomp, cgeom, cbc); - - int idummy1=0, idummy2=0; - bool cc = fpc.ba_crse_patch.ixType().cellCentered(); - ignore_unused(cc); -#ifdef _OPENMP -#pragma omp parallel if (cc) -#endif - for (MFIter mfi(mf_crse_patch); mfi.isValid(); ++mfi) - { - int li = mfi.LocalIndex(); - int gi = fpc.dst_idxs[li]; - const Box& dbx = fpc.dst_boxes[li]; - - Vector bcr(ncomp); - amrex::setBC(dbx,fdomain,scomp,0,ncomp,bcs,bcr); - - mapper->interp(mf_crse_patch[mfi], - 0, - mf[gi], - dcomp, - ncomp, - dbx, - ratio, - cgeom, - fgeom, - bcr, - idummy1, idummy2, RunOn::Cpu); - } - } - } - - FillPatchSingleLevel(mf, time, fmf, ft, scomp, dcomp, ncomp, fgeom, fbc); - } -}//namespace diff --git a/Src/AmrTask/Makefile b/Src/AmrTask/Makefile deleted file mode 100644 index 5bdc7b13c56..00000000000 --- a/Src/AmrTask/Makefile +++ /dev/null @@ -1,17 +0,0 @@ -include ./arch.common - -SUBDIRS = graph $(RTS_DIR) Amr tutorials/UnitTests/ AMFIter tutorials/MiniApps/HeatEquation - -.PHONY: build $(SUBDIRS) - -build: $(SUBDIRS) - -$(SUBDIRS): - $(MAKE) -C $@ - -.PHONY: all - -all: build - -clean: - $(foreach dir, $(SUBDIRS), $(MAKE) -C $(dir) clean;) diff --git a/Src/AmrTask/arch.common b/Src/AmrTask/arch.common deleted file mode 100644 index 940944a3fc6..00000000000 --- a/Src/AmrTask/arch.common +++ /dev/null @@ -1,4 +0,0 @@ -ROOT_PATH= /home/users/nnguyent/lbl/amrex/Src/AmrTask - -include $(ROOT_PATH)/arch/arch.mpi.generic -#include $(ROOT_PATH)/arch/arch.serial diff --git a/Src/AmrTask/arch/arch.mpi.generic b/Src/AmrTask/arch/arch.mpi.generic deleted file mode 100755 index 6772e25989c..00000000000 --- a/Src/AmrTask/arch/arch.mpi.generic +++ /dev/null @@ -1,64 +0,0 @@ -RM = rm -f -LN = ln -s -ECHO = echo - -C++ = mpicxx -CC = mpicc - -C++LINK = $(C++) -CLINK = $(C++) - -COPTIMIZATION = -O3 - -C++FLAGS += -std=c++11 $(COPTIMIZATION) -fopenmp -openmp #$(DEBUG) - -LDFLAGS += $(C++FLAGS) -LDLIBS = -lpthread - -RTS_DIR = $(ROOT_PATH)/rts_impls/MPI_Generic/ -INCLUDE = $(RTS_DIR) - -SEGSIZE = -DSEGMENT_SIZE=2147483648 - -######################################################################### -# End of the System dependent prefix -######################################################################### - - -######################################################################### -# # -# Suffixes for compiling most normal C++, C files # -# # -######################################################################### - -.SUFFIXES: -.SUFFIXES: .C .cxx .c .cpp .o - -.C.o: - @$(ECHO) - @$(ECHO) "Compiling Source File --" $< - @$(ECHO) "---------------------" - $(C++) $(C++FLAGS) -c $< - @$(ECHO) - -.cxx.o: - @$(ECHO) - @$(ECHO) "Compiling Source File --" $< - @$(ECHO) "---------------------" - $(C++) $(C++FLAGS) -c $< - @$(ECHO) - -.cpp.o: - @$(ECHO) - @$(ECHO) "Compiling Source File --" $< - @$(ECHO) "---------------------" - $(C++) $(C++FLAGS) -c $< - @$(ECHO) - -.c.o: - @$(ECHO) - @$(ECHO) "Compiling Source File --" $< - @$(ECHO) "---------------------" - $(CC) $(C++FLAGS) -c $< - @$(ECHO) - diff --git a/Src/AmrTask/arch/arch.serial b/Src/AmrTask/arch/arch.serial deleted file mode 100755 index ab28167c033..00000000000 --- a/Src/AmrTask/arch/arch.serial +++ /dev/null @@ -1,63 +0,0 @@ -RM = rm -f -LN = ln -s -ECHO = echo - -C++ = g++ -CC = gcc - -C++LINK = $(C++) -CLINK = $(C++) - -COPTIMIZATION = -O3 - -C++FLAGS += -std=c++11 
$(COPTIMIZATION) $(DEBUG) - -LDFLAGS += $(C++FLAGS) -LDLIBS = - -RTS_DIR = $(ROOT_PATH)/rts_impls/Serial/ -INCLUDE = $(RTS_DIR) - - -######################################################################### -# End of the System dependent prefix -######################################################################### - - -######################################################################### -# # -# Suffixes for compiling most normal C++, C files # -# # -######################################################################### - -.SUFFIXES: -.SUFFIXES: .C .cxx .c .cpp .o - -.C.o: - @$(ECHO) - @$(ECHO) "Compiling Source File --" $< - @$(ECHO) "---------------------" - $(C++) $(C++FLAGS) -c $< - @$(ECHO) - -.cxx.o: - @$(ECHO) - @$(ECHO) "Compiling Source File --" $< - @$(ECHO) "---------------------" - $(C++) $(C++FLAGS) -c $< - @$(ECHO) - -.cpp.o: - @$(ECHO) - @$(ECHO) "Compiling Source File --" $< - @$(ECHO) "---------------------" - $(C++) $(C++FLAGS) -c $< - @$(ECHO) - -.c.o: - @$(ECHO) - @$(ECHO) "Compiling Source File --" $< - @$(ECHO) "---------------------" - $(CC) $(C++FLAGS) -c $< - @$(ECHO) - diff --git a/Src/AmrTask/graph/AMReX_AbstractTask.H b/Src/AmrTask/graph/AMReX_AbstractTask.H deleted file mode 100644 index b191781d5b2..00000000000 --- a/Src/AmrTask/graph/AMReX_AbstractTask.H +++ /dev/null @@ -1,274 +0,0 @@ -#ifndef AMREX_ABSTRACT_TASK -#define AMREX_ABSTRACT_TASK -//Question? email tannguyen@lbl.gov -//Created 07-19-2017 -//Last modification 08-07-2017 - -#include "AMReX_DataTypes.H" -#include -#include -#include -#include -#include -#include -#include -#include -#include "rts_taskimpl.H" -using namespace std; - -namespace amrex{ - - class TaskName{ - protected: - std::vector _ids; - public: - TaskName(){} - TaskName(int id){_ids.push_back(id);} - TaskName(int id0, int id1){_ids.push_back(id0); _ids.push_back(id1);} - TaskName(int id0, int id1, int id2){_ids.push_back(id0); _ids.push_back(id1); _ids.push_back(id2);} - TaskName(int id0, int id1, int id2, int id3){_ids.push_back(id0); _ids.push_back(id1); _ids.push_back(id2);_ids.push_back(id3);} - int& operator[](int i){return _ids[i];} - const int& operator[](int i) const{return _ids[i];} - TaskName& operator=(const TaskName &rhs){ - assert(_ids.size()==0 || _ids.size()== rhs.Dim()); - if(_ids.size()==0) - for(int i=0; i< rhs.Dim(); i++) - _ids.push_back(rhs[i]); - else //already have the same dim - for(int i=0; i< _ids.size(); i++) - _ids[i] = rhs[i]; - return *this; - } - bool operator== (const TaskName &rhs) const{ - if(_ids.size() != rhs.Dim()) return false; - for(int i=0; i< _ids.size(); i++) - if(_ids[i] != rhs[i]) return false; - return true; - } - bool operator!= (const TaskName &rhs) const{ - if(_ids.size() != rhs.Dim()) return true; - for(int i=0; i< _ids.size(); i++) - if(_ids[i] != rhs[i]) return true; - return false; - } - bool operator< (const TaskName &rhs) const{ - if(_ids.size() < rhs.Dim()) return true; - if(_ids.size() > rhs.Dim()) return false; - for(int i= _ids.size()-1; i>=0; i--){ - if(_ids[i] > rhs[i]) return false; - if(_ids[i] < rhs[i]) return true; - } - return false; - } - void SetSize(int dim){ - for(int i=0; i > > _dataMap; - size_t _size; - - public: - //return the total number of inputs/outputs of a task - size_t size(){ - size_t s=0; - std::map > >::iterator it= _dataMap.begin(); - while (it!= _dataMap.end()){ - std::map >::iterator tagIt= ((*it).second).begin(); - while (tagIt!= ((*it).second).end()){ - s+= (*tagIt).second.size(); - tagIt++; - } - it++; - } - return s; - } - bool 
isSatisfied(TaskName name, int tag=0){ - if(_dataMap.find(name) != _dataMap.end()){ - if(_dataMap[name].find(tag) != _dataMap[name].end()){ - return _dataMap[name][tag].size() >0; - } - } - return false; - } - bool empty(){return _size==0;} - void push_back(TaskName name, Data* d, int tag=0){ - _dataMap[name][tag].push(d); - _size++; - } - Data* pop_front(TaskName name, int tag=0){ - if(_dataMap[name][tag].size()==0) return NULL; - Data* d= _dataMap[name][tag].front(); - _dataMap[name][tag].pop(); - _size--; - return d; - } - std::queue< Data* >& GetDependencies(TaskName name, int tag=0){return _dataMap[name][tag];} - }; - - //! The most abstract task - class Task{ - protected: - TaskName _id; - DependencyMap _neighbors_in; - std::queue _outputs; - std::queue _newTasks; - bool _isPersistent; - bool _isMasterTask; - public: - Task():_isPersistent(true),_isMasterTask(false){} - Task(TaskName name):_isPersistent(true),_isMasterTask(false){_id= name;} - //Describe Data Dependency - virtual bool Dependency()=0; - //! What the task is supposed to do - virtual void Job()=0; - //! Once the task finished its computation, any actions should be taken (like create new taks)? - virtual void PostCompletion()=0; - TaskName MyName(){return _id;} - void SetName(TaskName id){ _id=id;} - void SetMaster(){_isMasterTask=true;} - - bool TestDependencies(){return Dependency();} - void RunJob(){Job();} - void RunPostCompletion(){PostCompletion();} - void Pull(TaskName src, char* d, size_t size, int tag=0); - void Push(TaskName dest, char* d, size_t size, int tag=0); - bool Depend_on(TaskName src, int tag=0){ - return _neighbors_in.isSatisfied(src, tag); - } - std::queue& GetOutputs(){return _outputs;} - std::queue& GetNewTasks(){return _newTasks;} - DependencyMap& GetInputs(){return _neighbors_in;} - void KeepTaskAlive(){_isPersistent=true;} - void SelfDestroy(){_isPersistent=false;} - bool isPersistent(){return _isPersistent;} - bool isMasterTask(){return _isMasterTask;} - - template void LocalAtomicAdd(T *addr, T val){ - LocalAtomicAdd_impl(addr, val); - } - template void GlobalAtomicAdd(T *addr, T val){ - GlobalAtomicAdd_impl(addr, val); - } - void barrierTask(){ - //BarrierTask_impl(); - } - void RegisterTask(Task* t){ - _newTasks.push(t); - } - }; - -#if 0 - //! This task is created to do LOCAL jobs (thus it is not migratable), when all data dependencies have been satisfied - class NonMigratableTask :public Task{ - protected: - TaskState st; - //! A task may depend on multiple pieces of data from another task - //! A task may send multiple pieces of data to another task - //DependencyMap neighbors_out; - public: - }; - - - //! This task can be migrated to a remote process (e.g. to be closer to data). - class MigratableTask :public Task{ - protected: - int origin;//original process - public: - virtual void pullData(); - }; - - - - - enum state_t{FRESH /*just created*/, PENDING/*waiting for data*/, READY/*data dependencies satisfied*/, RUNNING /*scheduled to run*/, FINISHED /*no more work to do*/, ERROR}; - class TaskState{ - private: - state_t _st; - - public: - TaskState():_st(PENDING){} - TaskState(state_t st):_st(st){} - void shift(); - void shift(state_t newState); - }; -#endif - - - - -}//end namespace - -#endif diff --git a/Src/AmrTask/graph/AMReX_AbstractTask.cpp b/Src/AmrTask/graph/AMReX_AbstractTask.cpp deleted file mode 100644 index ab5983ce73e..00000000000 --- a/Src/AmrTask/graph/AMReX_AbstractTask.cpp +++ /dev/null @@ -1,18 +0,0 @@ -#include -//Question? 
email tannguyen@lbl.gov -//Created 07-19-2017 -//Last modification 07-24-2017 - -namespace amrex{ - void Task::Pull(TaskName src, char* d, size_t size, int tag){ - Data* data= _neighbors_in.pop_front(src, tag); - memcpy(d, data->GetBuffer(), size); - data->Free(); - } - void Task::Push(TaskName dest, char* d, size_t size, int tag){ - Data* data= new Data(_id, dest, size); - data->SetTag(tag); - memcpy(data->GetBuffer(), d, size); - _outputs.push(data); - } -} diff --git a/Src/AmrTask/graph/AMReX_Affinity.H b/Src/AmrTask/graph/AMReX_Affinity.H deleted file mode 100644 index e69de29bb2d..00000000000 diff --git a/Src/AmrTask/graph/AMReX_Affinity.cpp b/Src/AmrTask/graph/AMReX_Affinity.cpp deleted file mode 100644 index e69de29bb2d..00000000000 diff --git a/Src/AmrTask/graph/AMReX_DataTypes.H b/Src/AmrTask/graph/AMReX_DataTypes.H deleted file mode 100644 index 2d1ec100158..00000000000 --- a/Src/AmrTask/graph/AMReX_DataTypes.H +++ /dev/null @@ -1,142 +0,0 @@ -#ifndef AMREX_PRIMITIVE_TYPES -#define AMREX_PRIMITIVE_TYPES -//Question? email tannguyen@lbl.gov -//Created 07-19-2017 -//Last modification 07-24-2017 - -#include -#include -#include -#include -#include -#include -#include -using namespace std; - -namespace amrex{ - //!This class is similar to IntVect, but it supports template - template - class PointVect{ - private: - int _vect[D]; - public: - class shift_hasher{ - private: - static const unsigned shift=0; - static const unsigned shift_stride=0; - shift_hasher(){ - shift=shift_stride= 8*sizeof(size_t)/D; - } - public: - size_t operator()(const PointVect& vec) const - { - size_t ret=_vect[0]; - for(int i=1; i& set(int i, int val){ - _vect[i]=val; - return *this; - } - PointVect& operator= (const PointVect& rhs) const{ - for(int i=0; i& operator= (const PointVect& rhs){ - for(int i=0; i& operator= (const int val) const{ - for(int i=0; i=0; i++){ - if(_vect[i]>rhs[i]) return false; - if(_vect[i]=0; i++){ - if(_vect[i]>rhs[i]) return false; - if(_vect[i] (const PointVect& rhs) const{ - for(int i=D-1; i>=0; i++){ - if(_vect[i]rhs[i]) return true; - } - return false; - } - bool operator>= (const PointVect& rhs) const{ - for(int i=D-1; i>=0; i++){ - if(_vect[i]rhs[i]) return true; - } - return true; - } - }; - - /* - template - class TaskTable{ - private: - std::unorderedMap, std::list, PointVect::shift_hasher> - public: - }; - */ -} - -#endif diff --git a/Src/AmrTask/graph/AMReX_TaskGraph.H b/Src/AmrTask/graph/AMReX_TaskGraph.H deleted file mode 100644 index 8095754dbe8..00000000000 --- a/Src/AmrTask/graph/AMReX_TaskGraph.H +++ /dev/null @@ -1,339 +0,0 @@ -#ifndef AMREX_ABSTRACT_TASKGRAPH -#define AMREX_ABSTRACT_TASKGRAPH -//Question? 
email tannguyen@lbl.gov -//Created 07-19-2017 -//Last modification 07-24-2017 - -#include -#include -#include -#include -#include -#include -#include -#include "AMReX_AbstractTask.H" -using namespace std; - -namespace amrex{ - - template - class BlockMapping{ - private: - PointVect _first, _last, _range, _size; - size_t _linearSize; - size_t _totalSize; - - public: - BlockMapping(PointVect gSize, PointVect myProc, PointVect nProcs){ - for(int i=0; i gSize, int myProc, int nProcs){ - size_t block; - size_t remainder; - size_t totalSize=gSize[0]; - for(int i=1; i=0; i--){ - subSize= subSize/gSize[i]; - _last[i]=last_linear/subSize; - _first[i]=first_linear/subSize; - _range[i]= _last[i]-_first[i] +1; - _size[i]= _range[i]; - last_linear= last_linear%subSize; - first_linear= first_linear%subSize; - } - } - - PointVect first(){return _first;} - PointVect last(){return _last;} - PointVect range(){return _range;} - PointVect size(){return _size;} - size_t linearSize(){return _linearSize;} - size_t totalSize(){return _totalSize;} - }; - - enum RunningMode{ - _Push=0,//The task will not be scheduled until all data dependencies are satified. Data are pushed by other tasks without its consent. - _Pull//The task will be fetched and it will pull dependencies from other tasks - }; - - class SelfAssociate{ - public: - TaskName TaskAssociate(TaskName name){ - return name; - } - }; - - //!This class defines data and task spaces, as well as options to decompose these spaces - template - class AbstractTaskGraph{ - struct TaskComp { - bool operator() (const TaskName& lhs, const TaskName& rhs) const - { - return lhs _initialTasks; - std::map _taskPool; - //! A process can iterate over tasks that it owns. However, how application tasks are mapped to processes will be defined at higher level classes. - Task *_begin, *_end, *_current; - typename std::vector::iterator _currIt; - size_t _nLocalTasks; - RunningMode _mode; - - public: - AbstractTaskGraph(string graphName=""): _graphName(graphName), _rank(0), _nProcs(1){ - _begin=NULL; - _end=NULL; - _current=NULL; - _nLocalTasks=0; - _mode= _Push; - } - void DestroyGraph(){ - for(typename std::vector::iterator it= _initialTasks.begin(); it!= _initialTasks.end(); it++){ - delete (*it); - } - _initialTasks.clear(); - _taskPool.clear(); - } - void DestroyTask(Task* t){ - _taskPool.erase(t->MyName()); - } - int MyProc(){return _rank;} - int ProcCount(){return _nProcs;} - RunningMode GetRunningMode(){return _mode;} - string GetTaskName(){return _graphName;} - void GraphSynchronize(); - std::map &GetTaskPool(){return _taskPool;} - Task* LocateTask(TaskName name){ - if(_taskPool.find(name)!= _taskPool.end()) - return _taskPool[name]; - return NULL; - } - virtual int FindProcessAssociation(TaskName name){ //maps task name to process rank - } - //!First element stored in the process - Task* Begin(){ - return _begin; - } - //!Last element stored in the process - Task* End(){ - return _end; - } - //! The next element - Task* Next(){ - _currIt++; - _current= *_currIt; - return _current; - } - //! The current element - Task* Current(){ - return _current; - } - }; - - - /** - * \brief This class is useful when we need a task graph to partition an irregular geometry. - * Tasks are created from a list of names (for example, box/data tile names), which can have multiple dimensions. - * These tasks are stored in a distributed hash map and can be accessed in constant time. 
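The template parameter lists in this header were eaten when the diff was extracted (every `<...>` span is gone), so the BlockMapping constructors read as bare `PointVect`/`int` signatures with truncated loops. For the 1-D constructor, the surviving `block`/`remainder`/`totalSize` locals suggest the conventional block distribution with the remainder assigned to the lowest ranks. A standalone sketch of that arithmetic under that assumption (the helper name blockRange is hypothetical):

```cpp
#include <algorithm>
#include <cstddef>
#include <iostream>

// [first, last] = linear task range owned by rank myProc when totalSize tasks
// are split over nProcs ranks; the first (totalSize % nProcs) ranks get one extra.
void blockRange(std::size_t totalSize, int myProc, int nProcs,
                std::size_t& first, std::size_t& last)
{
    const std::size_t block     = totalSize / nProcs;
    const std::size_t remainder = totalSize % nProcs;
    const std::size_t rank      = static_cast<std::size_t>(myProc);
    first = rank * block + std::min(rank, remainder);
    last  = first + block - 1 + (rank < remainder ? 1 : 0);
}

int main()
{
    std::size_t first, last;
    for (int r = 0; r < 3; ++r) {             // 10 tasks over 3 ranks: 4,3,3
        blockRange(10, r, 3, first, last);
        std::cout << "rank " << r << ": [" << first << "," << last << "]\n";
    }
}
```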
- * A task can create another task dynamically and set it location (i.e., which process owns the newly created task). - * The default location is that of the the parent task. - */ - template - class ArrayGraph: public AbstractTaskGraph{ - protected: - string _graphName; - BlockMapping *_taskMap; - PointVect _graphSize; - - public: - //! Create a 1D Task Graph - ArrayGraph(string graphName, int graphSize, int rank, int nProcs): _graphName(graphName), _graphSize(graphSize){ - assert(D==1); - AbstractTaskGraph::_nProcs= nProcs; - AbstractTaskGraph::_rank= rank; - _taskMap= new BlockMapping<1>(PointVect<1>(graphSize), PointVect<1>(rank), PointVect<1>(nProcs)); - for(int i=_taskMap->first()[0], idx=0; i<=_taskMap->last()[0]; i++, idx++){ - TaskName name(i); - T *t= new T(); - t->SetName(name); - AbstractTaskGraph::_initialTasks.push_back(t); - AbstractTaskGraph::_taskPool[name]= t; - } - AbstractTaskGraph::_begin= *(AbstractTaskGraph::_initialTasks.begin()); - AbstractTaskGraph::_end= *(AbstractTaskGraph::_initialTasks.end()); - AbstractTaskGraph::_currIt= AbstractTaskGraph::_initialTasks.begin(); - AbstractTaskGraph::_current= *(AbstractTaskGraph::_currIt); - AbstractTaskGraph::_mode= _Push; - } - //! Create a multidimensional graph and LINEARLY map it to processors - ArrayGraph(string graphName, PointVect graphSize, int rank, int nProcs): _graphName(graphName){ - _graphSize= graphSize; - AbstractTaskGraph::_nProcs= nProcs; - AbstractTaskGraph::_rank= rank; - _taskMap= new BlockMapping(graphSize, rank, nProcs); - PointVect p=_taskMap->first(); - for(int i=0; i<_taskMap->linearSize(); i++){ - TaskName name; - name.SetSize(D); - for(int j=0; jSetName(name); - AbstractTaskGraph::_initialTasks.push_back(t); - AbstractTaskGraph::_taskPool[name]= t; - for(int d=0; d::_begin= *(AbstractTaskGraph::_initialTasks.begin()); - AbstractTaskGraph::_end= *(AbstractTaskGraph::_initialTasks.end()); - AbstractTaskGraph::_currIt= AbstractTaskGraph::_initialTasks.begin(); - AbstractTaskGraph::_current= *(AbstractTaskGraph::_currIt); - AbstractTaskGraph::_mode= _Push; - } - int FindProcessAssociation(TaskName name){ - A associate; - TaskName n= associate.TaskAssociate(name); - size_t block_size= _taskMap->totalSize()/AbstractTaskGraph::ProcCount(); - size_t val=n[0]; - size_t stride=1; - for(int d=1; d* GetTaskMap(){return &_taskMap;} - void Destroy(){ - for(typename std::vector::iterator it= AbstractTaskGraph::_initialTasks.begin(); it!= AbstractTaskGraph::_initialTasks.end(); it++){ - delete (*it); - } - AbstractTaskGraph::_initialTasks.clear(); - AbstractTaskGraph::_taskPool.clear(); - delete _taskMap; - } - }; - -#if 0 - //! This class should be used when we want to create a rectangular task space (data and/or time). - template - class CartesianGraph: public AbstractTaskGraph{ - protected: - string _graphName; - BlockMapping* _taskMap; - - public: - //create a multi-dimensional taskGraph using P processes - CartesianGraph(string graphName="", PointVect graphSize, PointVect Prank, PointVect Psize){ - _taskMap= new BlockMapping(graphSize, Prank, Psize); - if(_taskMap.size() !=0){ - TaskName name(_taskMap.first()[0]); - size_t nTasks= _taskMap.size()[0]; - for (int d=1; dfirst()[d], idx=0; i<=_taskMap->last()[d]; i++, idx++){ - T *t= new T(); - t->SetName(name); - AbstractTaskGraph::_initialTasks.push_back(t); - AbstractTaskGraph::_taskPool[name]= t; - } - } - } - - - } - BlockMapping* GetTaskMap(){return &_taskMap;} - }; -#endif - - -#if 0 - - //Data are distributed linearly, though a multi-dimensional key (e.g. 
task name) is required to locate them - template - class LinearMapping::public AbstractMapping{ - private: - std::unorderedMap, std::list, PointVect::shift_hasher> _data; - public: - LinearMapping(std::vector< PointVect > nameVect){ - _begin[0]= nameVect[0]; - _end[0]= nameVect[nameVect.size()-1]; - _size[0]= nameVect.size(); - } - }; - - // - - template - class CyclicMapping: public AbstractMapping{ - private: - - public: - CyclicMapping(PointVect gSize, PointVect myProc, PointVect nProcs){ - for(int i=0; i - class BlockyCylicMapping{ - private: - CyclicMapping(PointVect gSize, PointVect blockSize, PointVect myProc, PointVect nProcs){ - for(int i=0; i -//Question? email tannguyen@lbl.gov -//Created 07-19-2017 -//Last modification 07-24-2017 - -namespace amrex{ - - -} diff --git a/Src/AmrTask/graph/Makefile b/Src/AmrTask/graph/Makefile deleted file mode 100755 index 82dddfef0d6..00000000000 --- a/Src/AmrTask/graph/Makefile +++ /dev/null @@ -1,24 +0,0 @@ -include ../arch.common - -GRAPH_LIB= graph.a - -OBJECTS= AMReX_AbstractTask.o AMReX_TaskGraph.o - -all: $(GRAPH_LIB) - -$(GRAPH_LIB): $(OBJECTS) - ar rv $(GRAPH_LIB) $(OBJECTS) - -$(OBJECTS): AMReX_AbstractTask.H AMReX_AbstractTask.cpp AMReX_TaskGraph.H AMReX_TaskGraph.cpp - -AMReX_AbstractTask.o: AMReX_AbstractTask.cpp AMReX_AbstractTask.H - $(C++) $(C++FLAGS) -I. -I$(INCLUDE) -c AMReX_AbstractTask.cpp -o AMReX_AbstractTask.o - -AMReX_TaskGraph.o: AMReX_TaskGraph.cpp AMReX_TaskGraph.H - $(C++) $(C++FLAGS) -I./ -I$(INCLUDE) -c AMReX_TaskGraph.cpp -o AMReX_TaskGraph.o - -.PHONY: clean - -clean: - $(RM) $(OBJECTS) - $(RM) graph.a diff --git a/Src/AmrTask/graph/RTS.H b/Src/AmrTask/graph/RTS.H deleted file mode 100644 index 5e230a86827..00000000000 --- a/Src/AmrTask/graph/RTS.H +++ /dev/null @@ -1,52 +0,0 @@ -#ifndef _RTS -#define _RTS -#include "AMReX_AbstractTask.H" -#include "AMReX_TaskGraph.H" -#include -#include -#include "rts_graphimpl.H" -#include - -using namespace std; - -namespace amrex{ - struct _workerThreadInfo{ - int _tid; //thread id in local group - int _size; //number of threads in the group - }; - - struct _threadInfo{ - bool _isComm; //whether this thread handles communication - int _wtid; //worker thread id (-1 if this thread is decicated to communication) - int _nWts; //number of thread groups - }; - - class RTS{ - private: - int _nWrks; - void RTS_Init(); - int _rank, _nProcs; - - public: - RTS(){ - _nWrks=1; - char* nWrks= getenv("NWORKERS"); - if(nWrks) _nWrks= atoi(nWrks); - } - RTS(int nWrks):_nWrks(nWrks){} - int ProcCount(); - int MyProc(); - int WorkerThreadCount(); - int MyWorkerThread(); - void Init(); //Build the runtime system from scratch - void Init(int rank, int nProcs);//Build the runtime system on pre-existing MPI processes - void Iterate(void *graph); - void Finalize(); - double Time(); - void Barrier(); - template void ReductionSum(T *local, T *global, int length, int root){ - ReductionSum_impl(local, global, length, root); - } - }; -} -#endif diff --git a/Src/AmrTask/make_defaults/Cori b/Src/AmrTask/make_defaults/Cori deleted file mode 100644 index e69de29bb2d..00000000000 diff --git a/Src/AmrTask/make_defaults/Edison b/Src/AmrTask/make_defaults/Edison deleted file mode 100644 index e69de29bb2d..00000000000 diff --git a/Src/AmrTask/make_defaults/Summit-dev b/Src/AmrTask/make_defaults/Summit-dev deleted file mode 100644 index e69de29bb2d..00000000000 diff --git a/Src/AmrTask/rts_impls/MPI_Generic/Makefile b/Src/AmrTask/rts_impls/MPI_Generic/Makefile deleted file mode 100755 index 050bbab1718..00000000000 
--- a/Src/AmrTask/rts_impls/MPI_Generic/Makefile +++ /dev/null @@ -1,27 +0,0 @@ -include ../../arch.common - -RTS_LIB= rts.a - -OBJECTS= rts.o sysInfo.o dl_malloc.o - -all: $(RTS_LIB) - -$(RTS_LIB): $(OBJECTS) - ar rv $(RTS_LIB) $(OBJECTS) - -#$(OBJECTS): rts.C - -rts.o: rts.C - $(C++) $(C++FLAGS) $(SEGSIZE) -DONLY_MSPACES=1 -I. -I../Utils/ -I$(INCLUDE) -I../../graph -c rts.C -o rts.o - -sysInfo.o: ../Utils/sysInfo.C - $(C++) $(C++FLAGS) -I../Utils/ -I$(INCLUDE) -c ../Utils/sysInfo.C -o sysInfo.o - -dl_malloc.o: - $(CC) -DONLY_MSPACES=1 -I../Utils/ -I$(INCLUDE) -O2 -c ../Utils/dl_malloc.c -o dl_malloc.o - -.PHONY: clean - -clean: - $(RM) $(OBJECTS) - $(RM) *.a diff --git a/Src/AmrTask/rts_impls/MPI_Generic/README b/Src/AmrTask/rts_impls/MPI_Generic/README deleted file mode 100644 index 9577b83c562..00000000000 --- a/Src/AmrTask/rts_impls/MPI_Generic/README +++ /dev/null @@ -1,17 +0,0 @@ -This is a runtime version that employs 2-sided MPI (i.e. MPI-1) to implement fundamental routines required to schedule an AMReX task dependency graph. -The runtime comprises a set of MPI processes, each consisting of multiple WORKER threads. -The runtime can be configured to run with 1 process per compute node (i), per NUMA node (ii), or per core (iii). -For cases (i) and (ii), there can be multiple WORKER threads per process (one WORKER thread per NUMA node or per core). -Also, the runtime can dedicate one or a few cores per compute node to handle communication in a responsive fashion. -For case (ii), WORKER thread and Communication HANDLER thread share the same core. - -Multiple worker threads may share a single task queue (for load balancing purpose). -Each worker thread also has a private queue serving as a task buffer, allowing scheduling latency and lock/unlock cost to be reduced. - -Note: one of the primary goals of this runtime implementation is PORTABILITY. - -Thus, there is no special assumption about MPI mode to be made. -For example, the runtime should run correctly whether MPI supports MPI_THREAD_FUNNELED (common scenario) or MPI_THREAD_MULTIPLE (not so common) mode. - -Also, we use Pthreads to implement WORKER threads. -At the application level, the programmer can use OpenMP to parallelize each task. diff --git a/Src/AmrTask/rts_impls/MPI_Generic/mylock.h b/Src/AmrTask/rts_impls/MPI_Generic/mylock.h deleted file mode 100644 index bddb8ed6970..00000000000 --- a/Src/AmrTask/rts_impls/MPI_Generic/mylock.h +++ /dev/null @@ -1,27 +0,0 @@ -#ifndef MYLOCK -#define MYLOCK - -#include - -class MyLock -{ - private: - pthread_mutex_t _lock; - - public: - MyLock(){ - pthread_mutex_init(&_lock, NULL); - } - ~MyLock(){ - pthread_mutex_destroy(&_lock); - } - void lock() - { - pthread_mutex_lock(&_lock); - } - void unlock() - { - pthread_mutex_unlock(&_lock); - } -}; -#endif diff --git a/Src/AmrTask/rts_impls/MPI_Generic/rts.C b/Src/AmrTask/rts_impls/MPI_Generic/rts.C deleted file mode 100644 index 6dddd3b12d5..00000000000 --- a/Src/AmrTask/rts_impls/MPI_Generic/rts.C +++ /dev/null @@ -1,593 +0,0 @@ -//Question? 
email tannguyen@lbl.gov -//Created 07-19-2017 -//Last modification 08-14-2017 -#include "AMReX_AbstractTask.H" -#include "AMReX_TaskGraph.H" -#include "RTS.H" -#include -#include -#include -#include -#include "sysInfo.H" -#include "mylock.h" -#include - -#include -#include -using namespace std; -#include - -namespace amrex{ - //we don't use template for task and message queuese since in the future we may implement them in different ways - class _TaskQueue { - private: - std::queue _queue; - MyLock _lock; - bool _NoLoad; //queue is empty and no onflight task - public: - _TaskQueue():_NoLoad(true){} - void push(Task* t){ - _lock.lock(); - _queue.push(t); - _NoLoad=false; - _lock.unlock(); - } - Task* pop(){ - _lock.lock(); - if(_queue.size()>0) { - Task*t = _queue.front(); - _queue.pop(); - _lock.unlock(); - return t; - } - _lock.unlock(); - return NULL; - } - Task* front(){ - _lock.lock(); - if(_queue.size()>0) { - Task*t = _queue.front(); - return t; - } - _lock.unlock(); - return NULL; - } - void SetNoLoad(){ - _lock.lock(); - if(_queue.size()==0)_NoLoad=true; - _lock.unlock(); - } - bool NoLoad(){return _NoLoad;} - size_t size(){ return _queue.size();} - }; - - class _MessageQueue{ - private: - std::queue _queue; - MyLock _lock; - public: - void push(Data* &d){ - _lock.lock(); - _queue.push(d); - _lock.unlock(); - } - Data* pop(){ - _lock.lock(); - if(_queue.size()>0) { - Data*d = _queue.front(); - _queue.pop(); - _lock.unlock(); - return d; - } - _lock.unlock(); - return NULL; - } - size_t size(){ return _queue.size();} - }; - - struct RtsDomain{ - _TaskQueue _WaitingQueue; - _TaskQueue _DataFetchingQueue; //used in Pull model - _TaskQueue _ReadyQueue; - _TaskQueue _RunningQueue; - _TaskQueue _ToCreateTaskQueue; - _TaskQueue _ToDestroyTaskQueue; - _MessageQueue _MsgQueue; - pthread_t *_threads; - _TaskQueue *_TaskBuffers; - int _size; - volatile int _activeSlaves; - MyLock _lock; - RtsDomain(){_threads=NULL; _size=0; _activeSlaves=0;}; - ~RtsDomain(){ - assert(_WaitingQueue.size()==0); - assert(_DataFetchingQueue.size()==0); - assert(_ReadyQueue.size()==0); - assert(_RunningQueue.size()==0); - assert(_ToCreateTaskQueue.size()==0); - assert(_ToDestroyTaskQueue.size()==0); - assert(_MsgQueue.size()==0); - free(_threads); - } - }; - int numa_nodes; - RtsDomain *dom; - int **_stopSignal; - AbstractTaskGraph* graph; - char* _DedicatedScheduler; - std::queue< std::pair > _SendRequests; - std::queue< std::pair > _RecvRequests; - std::queue _recvBuffers; - MyLock _l; -#define MAX_RECV_QUEUE 4 - - int RTS::ProcCount(){ - return _nProcs; - } - - int RTS::MyProc(){ - return _rank; - } - - int RTS::WorkerThreadCount(){ - return _nWrks; - } - - int RTS::MyWorkerThread(){ - return 0; - } - - struct argT { - int numaID; - int tid; - int nThreads; - }; - void run(void* threadInfo){ - argT *args= (argT*)threadInfo; - int numaID= args->numaID; - int tid= args->tid; - int nThreads= args->nThreads; - dom[numaID]._lock.lock(); - if(dom[numaID]._activeSlaves==0){ - _stopSignal[numaID]= new int[nThreads]; - } - _stopSignal[numaID][tid]=0; - dom[numaID]._activeSlaves++; - dom[numaID]._lock.unlock(); - if(dom[numaID]._TaskBuffers[tid].size()==0) dom[numaID]._TaskBuffers[tid].SetNoLoad(); - while(true){ - //if local task queue is empty, pull at most 2 tasks from the global queue - if(dom[numaID]._TaskBuffers[tid].size()==0){ - int nReadyTasks= dom[numaID]._ReadyQueue.size(); - if(nReadyTasks){ - Task* t= dom[numaID]._ReadyQueue.pop(); - if(t) dom[numaID]._TaskBuffers[tid].push(t); - 
if(dom[numaID]._ReadyQueue.size() >= nThreads){ //get one more task - Task* t1= dom[numaID]._ReadyQueue.pop(); - if(t1) dom[numaID]._TaskBuffers[tid].push(t1); - } - } - } - - if(dom[numaID]._TaskBuffers[tid].size()){ - Task* t= dom[numaID]._TaskBuffers[tid].pop(); - if(t){ - t->RunJob(); - t->RunPostCompletion(); - //Flush all outputs - while(t->GetOutputs().size()>0){ - Data* outdata= t->GetOutputs().front(); - t->GetOutputs().pop(); - if(outdata){ - TaskName dst= outdata->GetRecipient(); - int tag= outdata->GetTag(); - if(graph->LocateTask(dst)){ - graph->LocateTask(dst)->GetInputs().push_back(outdata->GetSource(), outdata, tag); - }else dom[numaID]._MsgQueue.push(outdata); - } - } - //process newly created tasks - while(t->GetNewTasks().size()>0){ - Task* nt= t->GetNewTasks().front(); - t->GetNewTasks().pop(); - dom[numaID]._ToCreateTaskQueue.push(nt); - } - //keep or destroy current task - if(t->isPersistent()){ - if(t->Dependency()){ - dom[numaID]._ReadyQueue.push(t); - }else{ - dom[numaID]._WaitingQueue.push(t); - } - }else{ - dom[numaID]._ToDestroyTaskQueue.push(t); - } - if(dom[numaID]._TaskBuffers[tid].size()==0){ - if(dom[numaID]._TaskBuffers[tid].NoLoad()==false) dom[numaID]._TaskBuffers[tid].SetNoLoad(); - } - } - } - if(_stopSignal[numaID][tid]) break; - } - free(args); - dom[numaID]._lock.lock(); - dom[numaID]._activeSlaves--; - if(dom[numaID]._activeSlaves==0){ - free(_stopSignal[numaID]); - } - dom[numaID]._lock.unlock(); - } - - void InitializeMPI(){ - int provided; - MPI_Init_thread(0, 0, MPI_THREAD_FUNNELED, &provided); - if(provided == MPI_THREAD_SINGLE){//with this MPI, process can't spawn threads - cerr << "Spawning threads is not allowed by the MPI implementation" << std::endl;; - } - } - - void RTS::RTS_Init(){ - NodeHardware hw = query_node_hardware(); - - assert(_nWrks>0 && _nWrks <= hw.core_per_numa * hw.numa_per_node); - - bool numaAware=true; - char* env= getenv("ENABLE_NUMA_AWARE"); - numaAware= (env!=NULL); - if(numaAware){ //the process covers multiple NUMA nodes - numa_nodes= hw.numa_per_node; - int worker_per_numa = _nWrks / numa_nodes; - int remainder= _nWrks % numa_nodes; - int r=0; - int base=0; - int localID=-1; - //create a list of persistent threads for each NUMA node - cpu_set_t cpuset; - pthread_attr_t attr; - pthread_attr_init(&attr); - dom= new RtsDomain[numa_nodes]; - _stopSignal= new int*[numa_nodes]; - for(int i=0; inumaID= domNo; - arg->tid= localID; - arg->nThreads= worker_per_numa+ (rnumaID= 0; - arg->tid= j; - arg->nThreads=_nWrks; - pthread_attr_setaffinity_np(&attr, sizeof(cpu_set_t), &mycpuset); - int err = pthread_create(&(dom[0]._threads[j]), &attr, (void*(*)(void*))run, arg); - }else dom[0]._threads[j]= pthread_self();// master thread - dom[0]._size++; - j++; - } - } - } - } - - void RTS::Init(){ - InitializeMPI(); - MPI_Comm_rank(MPI_COMM_WORLD, &_rank); - MPI_Comm_size(MPI_COMM_WORLD, &_nProcs); - RTS_Init(); - } - - void RTS::Init(int rank, int nProcs){ - _rank= rank; - _nProcs= nProcs; - RTS_Init(); - } - - void RTS::Finalize(){ - for(int d=0; d*)taskgraph; - //visit all initial tasks - { - Task* t= graph->Begin(); - int numaID=0; - while(t != graph->End()){ - if(graph->GetRunningMode()== _Push) - { - if(t->Dependency()){//all data have arrived - dom[numaID]._ReadyQueue.push(t); - }else{ - dom[numaID]._WaitingQueue.push(t); - } - }else{//Pull mode - dom[numaID]._DataFetchingQueue.push(t); - } - t = graph->Next(); - numaID= (numaID+1)%numa_nodes; //just use a simple round robin distribution for now - } - } - bool 
keepRunning=true; - //allocate a static buffer for incoming messages - size_t max_buf_size=2<<24; - if(env) max_buf_size= atoi(env); - for(int i=0; i< MAX_RECV_QUEUE; i++){ - char* _recvBuffer= new char[max_buf_size]; - _recvBuffers.push(_recvBuffer); - } - - dom[0]._TaskBuffers[0].SetNoLoad(); - while (keepRunning){ - //Handle communication - { - if(graph->GetRunningMode()== _Push) - { - //Process outgoing messages for all domains - for(int d=0; dGetRecipient(); - if(graph->LocateTask(name)){ - Task* t= graph->LocateTask(name); - t->GetInputs().push_back(msg->GetSource(), msg, msg->GetTag()); - } - else{ //Recipient is either on a remote node or has not been created - int destRank= msg->GetDestRank(); - if(destRank==-1) destRank= graph->FindProcessAssociation(name); //the runtime handles the mapping - if(destRank== MyProc()) dom[d]._MsgQueue.push(msg); //keep in local message queue since recipient task has not been created - else {//remote node - MPI_Request* req= new MPI_Request; - MPI_Isend(msg->SerializeData(), msg->GetSerializedSize(), MPI_CHAR, destRank, 0, MPI_COMM_WORLD, req); - _SendRequests.push(std::pair(req, msg)); - } - } - } - } - } - //prepost receives - if(_RecvRequests.size() < MAX_RECV_QUEUE){ - MPI_Request* req= new MPI_Request; - char* _recvBuffer=NULL; - if(_recvBuffers.size()){ - _recvBuffer= _recvBuffers.front(); - _recvBuffers.pop(); - }else _recvBuffer= new char[max_buf_size]; - MPI_Irecv(_recvBuffer, max_buf_size, MPI_CHAR, MPI_ANY_SOURCE, 0, MPI_COMM_WORLD, req); - _RecvRequests.push(std::pair(req, _recvBuffer)); - } - //check send status - int nSendRequests= _SendRequests.size(); - for(int i=0; i p= _SendRequests.front(); - MPI_Request *req= p.first; - _SendRequests.pop(); - MPI_Test(req, &done, MPI_STATUS_IGNORE); - if(done){ - Data* d= p.second; - d->Free(); - free(req); - }else _SendRequests.push(p); - } - //check recv status - int nRecvRequests= _RecvRequests.size(); - for(int i=0; i p= _RecvRequests.front(); - MPI_Request *req= p.first; - _RecvRequests.pop(); - MPI_Test(req, &done, MPI_STATUS_IGNORE); - if(done){ - Data* msg= new Data(p.second); //deserialize - TaskName name= msg->GetRecipient(); - TaskName src= msg->GetSource(); - Task* t= graph->LocateTask(name); - if(t){ - t->GetInputs().push_back(msg->GetSource(), msg, msg->GetTag()); - }else dom[0]._MsgQueue.push(msg); - free(req); - }else _RecvRequests.push(p); - } - }else{ - } - } - //visit waiting tasks in all domains - if(graph->GetRunningMode()== _Push) - { //no else - for(int d=0; dDependency()){ - dom[d]._ReadyQueue.push(t); - }else{ - dom[d]._WaitingQueue.push(t); - } - } - } - } - - if(!_DedicatedScheduler){ - //pull one task directly from global task queue - if(graph->GetRunningMode()== _Push){ - int nReadyTasks= dom[0]._ReadyQueue.size(); - if(nReadyTasks){ - Task* t= dom[0]._ReadyQueue.pop(); - if(t){ - t->RunJob(); - t->RunPostCompletion(); - //Flush all outputs - while(t->GetOutputs().size()>0){ - Data* outdata= t->GetOutputs().front(); - t->GetOutputs().pop(); - if(outdata){ - TaskName dst= outdata->GetRecipient(); - int tag= outdata->GetTag(); - if(graph->LocateTask(dst)){ - graph->LocateTask(dst)->GetInputs().push_back(outdata->GetSource(), outdata, tag); - }else dom[0]._MsgQueue.push(outdata); - } - } - //process newly created tasks for domain 0 - while(t->GetNewTasks().size()>0){ - Task* nt= t->GetNewTasks().front(); - t->GetNewTasks().pop(); - graph->GetTaskPool()[nt->MyName()]=nt; - if(nt->Dependency()){//all data have arrived - dom[0]._ReadyQueue.push(nt); - }else{ - 
dom[0]._WaitingQueue.push(nt); - } - } - //keep or destroy task for domain 0 - if(t->isPersistent()){ - if(t->Dependency()){ - dom[0]._ReadyQueue.push(t); - }else{ - dom[0]._WaitingQueue.push(t); - } - }else{ - //remove task from the task pool and delete it - graph->DestroyTask(t); - } - } - } - } - } - - - //service new task creation and destroy for other workers - for(int d=0; dGetTaskPool()[nt->MyName()]=nt; - if(nt->Dependency()){//all data have arrived - dom[d]._ReadyQueue.push(nt); - }else{ - dom[d]._WaitingQueue.push(nt); - } - } - } - } - for(int d=0; dDestroyTask(ot); - } - } - } - - keepRunning=false; - for(int d=0; dGetTaskPool().size() || dom[d]._ToCreateTaskQueue.size() || dom[d]._ToDestroyTaskQueue.size()) { - keepRunning=true; - break; - } - } - } - }//end while (keepRunning) - //cancel all unused preposted requests - while(_SendRequests.size()){ - MPI_Cancel(_SendRequests.front().first); - free(_SendRequests.front().first); - free(_SendRequests.front().second); - _SendRequests.pop(); - } - - //free recv buffers if any left - while(_recvBuffers.size()){ - free(_recvBuffers.front()); - _recvBuffers.pop(); - } - } - - const double kMicro = 1.0e-6; - double RTS::Time() - { - struct timeval TV; - - const int RC = gettimeofday(&TV, NULL); - if(RC == -1) - { - printf("ERROR: Bad call to gettimeofday\n"); - return(-1); - } - return( ((double)TV.tv_sec) + kMicro * ((double)TV.tv_usec) ); - } - - void RTS::Barrier(){ - //nothing - } - -}//end namespace - diff --git a/Src/AmrTask/rts_impls/MPI_Generic/rts_graphimpl.H b/Src/AmrTask/rts_impls/MPI_Generic/rts_graphimpl.H deleted file mode 100644 index c4e2cab2ef7..00000000000 --- a/Src/AmrTask/rts_impls/MPI_Generic/rts_graphimpl.H +++ /dev/null @@ -1,26 +0,0 @@ -#ifndef COLLECTIVE_IMPL -#define COLLECTIVE_IMPL - -//Question? email tannguyen@lbl.gov -//Created 07-19-2017 -//Last modification 07-21-2017 - -#include -#include -using namespace std; -#include -#include -using std::is_same; - -namespace amrex{ - - template - void ReductionSum_impl(T *local, T *global, int length, int root){ - MPI_Datatype datatype; - if(is_same::value) datatype= MPI_DOUBLE; - MPI_Reduce(local, global, length, datatype, MPI_SUM, root, MPI_COMM_WORLD); - } - -}//end namespace - -#endif diff --git a/Src/AmrTask/rts_impls/MPI_Generic/rts_taskimpl.H b/Src/AmrTask/rts_impls/MPI_Generic/rts_taskimpl.H deleted file mode 100644 index a12d1866c35..00000000000 --- a/Src/AmrTask/rts_impls/MPI_Generic/rts_taskimpl.H +++ /dev/null @@ -1,27 +0,0 @@ -#ifndef MYATOMICS -#define MYATOMICS - -//Question? email tannguyen@lbl.gov -//Created 07-19-2017 -//Last modification 07-21-2017 - -#include -#include -using namespace std; -#include -#include "mylock.h" - -namespace amrex{ - extern MyLock _l; - template void LocalAtomicAdd_impl(T *addr, T val){ - _l.lock(); - *addr+= val; - _l.unlock(); - } - template void GlobalAtomicAdd_impl(T *addr, T val){ - assert(false);//not defined - } - -}//end namespace - -#endif diff --git a/Src/AmrTask/rts_impls/README b/Src/AmrTask/rts_impls/README deleted file mode 100644 index 7a2ef06c4e4..00000000000 --- a/Src/AmrTask/rts_impls/README +++ /dev/null @@ -1,6 +0,0 @@ -Given an AMReX task graph program, a runtime system operates the program execution. -In particular, the runtime system manages task creation and distribution, schedules tasks, and handles communication among tasks, etc. -Since a task graph representation exhibits partial orderings among tasks, the program can be operated in many ways. 
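One concrete example of how the MPI_Generic runtime above handles communication among tasks: its Iterate loop posts MPI_Isend/MPI_Irecv, then repeatedly pops the oldest request, calls MPI_Test, and re-queues it if incomplete. A minimal self-contained sketch of that poll-and-requeue pattern (illustrative names, not the deleted runtime itself):

```cpp
#include <mpi.h>
#include <queue>
#include <utility>
#include <vector>

int main(int argc, char** argv)
{
    MPI_Init(&argc, &argv);
    int rank, nprocs;
    MPI_Comm_rank(MPI_COMM_WORLD, &rank);
    MPI_Comm_size(MPI_COMM_WORLD, &nprocs);

    // In-flight sends, oldest first, mirroring _SendRequests in rts.C.
    std::queue<std::pair<MPI_Request, std::vector<char>>> inflight;

    std::vector<char> payload(64, static_cast<char>(rank));
    MPI_Request req;
    MPI_Isend(payload.data(), static_cast<int>(payload.size()), MPI_CHAR,
              (rank + 1) % nprocs, 0, MPI_COMM_WORLD, &req);
    inflight.push({req, std::move(payload)}); // buffer must outlive the send

    // Matching receive so the example terminates.
    std::vector<char> rbuf(64);
    MPI_Recv(rbuf.data(), static_cast<int>(rbuf.size()), MPI_CHAR,
             (rank + nprocs - 1) % nprocs, 0, MPI_COMM_WORLD, MPI_STATUS_IGNORE);

    // Poll-and-requeue: test the oldest request; if unfinished, put it back.
    while (!inflight.empty()) {
        auto p = std::move(inflight.front());
        inflight.pop();
        int done = 0;
        MPI_Test(&p.first, &done, MPI_STATUS_IGNORE);
        if (!done) inflight.push(std::move(p)); // try again on the next pass
        // when done, the request is MPI_REQUEST_NULL and the buffer dies here
    }
    MPI_Finalize();
}
```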
-Different runtime systems can employ different scheduling policies. -In this directory, we include interfaces to existing runtime systems. -The user can select the one best suited to a particular application and hardware architecture. diff --git a/Src/AmrTask/rts_impls/Serial/Makefile b/Src/AmrTask/rts_impls/Serial/Makefile deleted file mode 100755 index 9d581c7dd58..00000000000 --- a/Src/AmrTask/rts_impls/Serial/Makefile +++ /dev/null @@ -1,22 +0,0 @@ -include ../../arch.common - -OBJECTS= rts.o - -RTS_LIB= rts.a - -OBJECTS= rts.o - -all: $(RTS_LIB) - -$(RTS_LIB): $(OBJECTS) - ar rv $(RTS_LIB) $(OBJECTS) - -$(OBJECTS): rts.C - -rts.o: rts.C - $(C++) $(C++FLAGS) -I. -I$(INCLUDE) -I../../graph -c rts.C -o rts.o - -.PHONY: clean - -clean: - $(RM) $(OBJECTS) diff --git a/Src/AmrTask/rts_impls/Serial/rts.C b/Src/AmrTask/rts_impls/Serial/rts.C deleted file mode 100644 index ddd5604b30e..00000000000 --- a/Src/AmrTask/rts_impls/Serial/rts.C +++ /dev/null @@ -1,177 +0,0 @@ -#include "AMReX_AbstractTask.H" -#include "AMReX_TaskGraph.H" -#include "RTS.H" -//Question? email tannguyen@lbl.gov -//Created 07-19-2017 -//Last modification 07-21-2017 - -#include -#include -using namespace std; -#include - -namespace amrex{ - typedef std::queue<Task*> _TaskQueue; - typedef std::queue<Data*> _MessageQueue; - _TaskQueue _WaitingQueue; - _TaskQueue _DataFetchingQueue; //used in Pull model - _TaskQueue _ReadyQueue; - _TaskQueue _RunningQueue; - _MessageQueue _MsgQueue; - - int RTS::ProcCount(){ - return 1; - } - - int RTS::MyProc(){ - return 0; - } - - int RTS::WorkerThreadCount(){ - return 1; - } - - int RTS::MyWorkerThread(){ - return 0; - } - - void RTS::Init(){ - } - - void RTS::Init(int rank, int nProcs){ - _rank=0; - _nProcs=1; - } - - void RTS::Finalize(){ - //Now, no task should be alive. Thus, this routine checks the contents of all task queues.
- assert(_WaitingQueue.size()==0); - assert(_DataFetchingQueue.size()==0); - assert(_ReadyQueue.size()==0); - assert(_RunningQueue.size()==0); - } - - void RTS::Iterate(void* taskgraph){ - AbstractTaskGraph* graph= (AbstractTaskGraph*)taskgraph; - //visit all initial tasks - { - Task* t= graph->Begin(); - while(t != graph->End()){ - if(graph->GetRunningMode()== _Push) - { - if(t->Dependency()){//all data have arrived - _ReadyQueue.push(t); - }else{ - _WaitingQueue.push(t); - } - }else{//Pull mode - _DataFetchingQueue.push(t); - } - t = graph->Next(); - } - } - bool keepRunning=true; - while (keepRunning){ - //Handle communication - { - if(graph->GetRunningMode()== _Push) - { - //Process messages - int nMsgs= _MsgQueue.size(); - for(int i=0; iGetRecipient(); - if(graph->LocateTask(name)){ - Task* t= graph->LocateTask(name); - t->GetInputs().push_back(msg->GetSource(), msg, msg->GetTag()); - } - else _MsgQueue.push(msg); //Recipient has not been created - } - }else{ - while(_DataFetchingQueue.size()){ - Task* t= _DataFetchingQueue.front(); - _DataFetchingQueue.pop(); - t->Dependency();//send active messages to pull data from source tasks - } - } - } - //visit waiting tasks (only in push mode) - if(graph->GetRunningMode()== _Push) - { //no else - int nWaitingTasks= _WaitingQueue.size(); - for(int i=0; iDependency()){ - _ReadyQueue.push(t); - }else{ - _WaitingQueue.push(t); - } - } - } - //Execute ready tasks - { - while(_ReadyQueue.size()){ - Task* t= _ReadyQueue.front(); - _ReadyQueue.pop(); - t->RunJob(); - t->RunPostCompletion(); - //Flush all outputs - while(t->GetOutputs().size()>0){ - Data* outdata= t->GetOutputs().front(); - t->GetOutputs().pop(); - TaskName dst= outdata->GetRecipient(); - int tag= outdata->GetTag(); - if(graph->LocateTask(dst)){ - graph->LocateTask(dst)->GetInputs().push_back(outdata->GetSource(), outdata, tag); - }else _MsgQueue.push(outdata); - } - //process newly created tasks - while(t->GetNewTasks().size()>0){ - Task* nt= t->GetNewTasks().front(); - t->GetNewTasks().pop(); - graph->GetTaskPool()[nt->MyName()]=nt; - if(nt->Dependency()){//all data have arrived - _ReadyQueue.push(nt); - }else{ - _WaitingQueue.push(nt); - } - } - //keep or destroy task - if(t->isPersistent()){ - if(t->Dependency()){ - _ReadyQueue.push(t); - }else{ - _WaitingQueue.push(t); - } - }else{ - //remove task from the task pool and delete it - graph->DestroyTask(t); - } - } - } - keepRunning= _WaitingQueue.size()>0 || _DataFetchingQueue.size()>0|| _ReadyQueue.size()>0|| _RunningQueue.size()>0|| _MsgQueue.size()>0 || graph->GetTaskPool().size()>0; - } - } - - const double kMicro = 1.0e-6; - double RTS::Time() - { - struct timeval TV; - - const int RC = gettimeofday(&TV, NULL); - if(RC == -1) - { - printf("ERROR: Bad call to gettimeofday\n"); - return(-1); - } - return( ((double)TV.tv_sec) + kMicro * ((double)TV.tv_usec) ); - } - - void RTS::Barrier(){ - //nothing - } - -}//end namespace - diff --git a/Src/AmrTask/rts_impls/Serial/rts_graphimpl.H b/Src/AmrTask/rts_impls/Serial/rts_graphimpl.H deleted file mode 100644 index 8563dd81626..00000000000 --- a/Src/AmrTask/rts_impls/Serial/rts_graphimpl.H +++ /dev/null @@ -1,18 +0,0 @@ -//Question? 
email tannguyen@lbl.gov -//Created 07-19-2017 -//Last modification 07-21-2017 - -#include -#include -using namespace std; -#include - -namespace amrex{ - - template - void ReductionSum_impl(T *local, T *global, int length, int root){ - for(int i=0; i -#include -using namespace std; -#include - -namespace amrex{ - - template void LocalAtomicAdd_impl(T *addr, T val){ - *addr+= val; - } - template void GlobalAtomicAdd_impl(T *addr, T val){ - *addr+= val; - } - -}//end namespace - diff --git a/Src/AmrTask/rts_impls/Utils/dl_malloc.c b/Src/AmrTask/rts_impls/Utils/dl_malloc.c deleted file mode 100644 index 27bce62d3ed..00000000000 --- a/Src/AmrTask/rts_impls/Utils/dl_malloc.c +++ /dev/null @@ -1,6326 +0,0 @@ -/* - This is a version (aka dlmalloc) of malloc/free/realloc written by - Doug Lea and released to the public domain, as explained at - http://creativecommons.org/publicdomain/zero/1.0/ Send questions, - comments, complaints, performance data, etc to dl@cs.oswego.edu - -* Version 2.8.6 Wed Aug 29 06:57:58 2012 Doug Lea - Note: There may be an updated version of this malloc obtainable at - ftp://gee.cs.oswego.edu/pub/misc/malloc.c - Check before installing! - -* Quickstart - - This library is all in one file to simplify the most common usage: - ftp it, compile it (-O3), and link it into another program. All of - the compile-time options default to reasonable values for use on - most platforms. You might later want to step through various - compile-time and dynamic tuning options. - - For convenience, an include file for code using this malloc is at: - ftp://gee.cs.oswego.edu/pub/misc/malloc-2.8.6.h - You don't really need this .h file unless you call functions not - defined in your system include files. The .h file contains only the - excerpts from this file needed for using this malloc on ANSI C/C++ - systems, so long as you haven't changed compile-time options about - naming and tuning parameters. If you do, then you can create your - own malloc.h that does include all settings by cutting at the point - indicated below. Note that you may already by default be using a C - library containing a malloc that is based on some version of this - malloc (for example in linux). You might still want to use the one - in this file to customize settings or to avoid overheads associated - with library versions. - -* Vital statistics: - - Supported pointer/size_t representation: 4 or 8 bytes - size_t MUST be an unsigned type of the same width as - pointers. (If you are using an ancient system that declares - size_t as a signed type, or need it to be a different width - than pointers, you can use a previous release of this malloc - (e.g. 2.7.2) supporting these.) - - Alignment: 8 bytes (minimum) - This suffices for nearly all current machines and C compilers. - However, you can define MALLOC_ALIGNMENT to be wider than this - if necessary (up to 128bytes), at the expense of using more space. - - Minimum overhead per allocated chunk: 4 or 8 bytes (if 4byte sizes) - 8 or 16 bytes (if 8byte sizes) - Each malloced chunk has a hidden word of overhead holding size - and status information, and additional cross-check word - if FOOTERS is defined. - - Minimum allocated size: 4-byte ptrs: 16 bytes (including overhead) - 8-byte ptrs: 32 bytes (including overhead) - - Even a request for zero bytes (i.e., malloc(0)) returns a - pointer to something of the minimum allocatable size. 
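The two serial implementation headers above are mangled by the same angle-bracket stripping: the reduction loop survives only as "for(int i=0; i". A plausible reconstruction of the three single-rank implementations, assuming the serial "sum" simply copies the local buffer (consistent with one process owning all the data):

```cpp
namespace amrex {
    // Serial ReductionSum: with one rank, the global sum is just the local data.
    template <typename T>
    void ReductionSum_impl(T* local, T* global, int length, int /*root*/) {
        for (int i = 0; i < length; i++) global[i] = local[i];
    }
    // Serial atomic adds: no concurrency, so plain additions suffice.
    template <typename T> void LocalAtomicAdd_impl(T* addr, T val)  { *addr += val; }
    template <typename T> void GlobalAtomicAdd_impl(T* addr, T val) { *addr += val; }
}

int main()
{
    double local[2] = {1.5, 2.5}, global[2];
    amrex::ReductionSum_impl(local, global, 2, 0);
    amrex::LocalAtomicAdd_impl(&global[1], 1.0);   // global[1] == 3.5
    return global[1] == 3.5 ? 0 : 1;
}
```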
- The maximum overhead wastage (i.e., number of extra bytes - allocated than were requested in malloc) is less than or equal - to the minimum size, except for requests >= mmap_threshold that - are serviced via mmap(), where the worst case wastage is about - 32 bytes plus the remainder from a system page (the minimal - mmap unit); typically 4096 or 8192 bytes. - - Security: static-safe; optionally more or less - The "security" of malloc refers to the ability of malicious - code to accentuate the effects of errors (for example, freeing - space that is not currently malloc'ed or overwriting past the - ends of chunks) in code that calls malloc. This malloc - guarantees not to modify any memory locations below the base of - heap, i.e., static variables, even in the presence of usage - errors. The routines additionally detect most improper frees - and reallocs. All this holds as long as the static bookkeeping - for malloc itself is not corrupted by some other means. This - is only one aspect of security -- these checks do not, and - cannot, detect all possible programming errors. - - If FOOTERS is defined nonzero, then each allocated chunk - carries an additional check word to verify that it was malloced - from its space. These check words are the same within each - execution of a program using malloc, but differ across - executions, so externally crafted fake chunks cannot be - freed. This improves security by rejecting frees/reallocs that - could corrupt heap memory, in addition to the checks preventing - writes to statics that are always on. This may further improve - security at the expense of time and space overhead. (Note that - FOOTERS may also be worth using with MSPACES.) - - By default detected errors cause the program to abort (calling - "abort()"). You can override this to instead proceed past - errors by defining PROCEED_ON_ERROR. In this case, a bad free - has no effect, and a malloc that encounters a bad address - caused by user overwrites will ignore the bad address by - dropping pointers and indices to all known memory. This may - be appropriate for programs that should continue if at all - possible in the face of programming errors, although they may - run out of memory because dropped memory is never reclaimed. - - If you don't like either of these options, you can define - CORRUPTION_ERROR_ACTION and USAGE_ERROR_ACTION to do anything - else. And if if you are sure that your program using malloc has - no errors or vulnerabilities, you can define INSECURE to 1, - which might (or might not) provide a small performance improvement. - - It is also possible to limit the maximum total allocatable - space, using malloc_set_footprint_limit. This is not - designed as a security feature in itself (calls to set limits - are not screened or privileged), but may be useful as one - aspect of a secure implementation. - - Thread-safety: NOT thread-safe unless USE_LOCKS defined non-zero - When USE_LOCKS is defined, each public call to malloc, free, - etc is surrounded with a lock. By default, this uses a plain - pthread mutex, win32 critical section, or a spin-lock if if - available for the platform and not disabled by setting - USE_SPIN_LOCKS=0. However, if USE_RECURSIVE_LOCKS is defined, - recursive versions are used instead (which are not required for - base functionality but may be needed in layered extensions). - Using a global lock is not especially fast, and can be a major - bottleneck. 
It is designed only to provide minimal protection - in concurrent environments, and to provide a basis for - extensions. If you are using malloc in a concurrent program, - consider instead using nedmalloc - (http://www.nedprod.com/programs/portable/nedmalloc/) or - ptmalloc (See http://www.malloc.de), which are derived from - versions of this malloc. - - System requirements: Any combination of MORECORE and/or MMAP/MUNMAP - This malloc can use unix sbrk or any emulation (invoked using - the CALL_MORECORE macro) and/or mmap/munmap or any emulation - (invoked using CALL_MMAP/CALL_MUNMAP) to get and release system - memory. On most unix systems, it tends to work best if both - MORECORE and MMAP are enabled. On Win32, it uses emulations - based on VirtualAlloc. It also uses common C library functions - like memset. - - Compliance: I believe it is compliant with the Single Unix Specification - (See http://www.unix.org). Also SVID/XPG, ANSI C, and probably - others as well. - -* Overview of algorithms - - This is not the fastest, most space-conserving, most portable, or - most tunable malloc ever written. However it is among the fastest - while also being among the most space-conserving, portable and - tunable. Consistent balance across these factors results in a good - general-purpose allocator for malloc-intensive programs. - - In most ways, this malloc is a best-fit allocator. Generally, it - chooses the best-fitting existing chunk for a request, with ties - broken in approximately least-recently-used order. (This strategy - normally maintains low fragmentation.) However, for requests less - than 256bytes, it deviates from best-fit when there is not an - exactly fitting available chunk by preferring to use space adjacent - to that used for the previous small request, as well as by breaking - ties in approximately most-recently-used order. (These enhance - locality of series of small allocations.) And for very large requests - (>= 256Kb by default), it relies on system memory mapping - facilities, if supported. (This helps avoid carrying around and - possibly fragmenting memory used only for large chunks.) - - All operations (except malloc_stats and mallinfo) have execution - times that are bounded by a constant factor of the number of bits in - a size_t, not counting any clearing in calloc or copying in realloc, - or actions surrounding MORECORE and MMAP that have times - proportional to the number of non-contiguous regions returned by - system allocation routines, which is often just 1. In real-time - applications, you can optionally suppress segment traversals using - NO_SEGMENT_TRAVERSAL, which assures bounded execution even when - system allocators return non-contiguous spaces, at the typical - expense of carrying around more memory and increased fragmentation. - - The implementation is not very modular and seriously overuses - macros. Perhaps someday all C compilers will do as good a job - inlining modular code as can now be done by brute-force expansion, - but now, enough of them seem not to. - - Some compilers issue a lot of warnings about code that is - dead/unreachable only on some platforms, and also about intentional - uses of negation on unsigned types. All known cases of each can be - ignored. - - For a longer but out of date high-level description, see - http://gee.cs.oswego.edu/dl/html/malloc.html - -* MSPACES - If MSPACES is defined, then in addition to malloc, free, etc., - this file also defines mspace_malloc, mspace_free, etc. 
These - are versions of malloc routines that take an "mspace" argument - obtained using create_mspace, to control all internal bookkeeping. - If ONLY_MSPACES is defined, only these versions are compiled. - So if you would like to use this allocator for only some allocations, - and your system malloc for others, you can compile with - ONLY_MSPACES and then do something like... - static mspace mymspace = create_mspace(0,0); // for example - #define mymalloc(bytes) mspace_malloc(mymspace, bytes) - - (Note: If you only need one instance of an mspace, you can instead - use "USE_DL_PREFIX" to relabel the global malloc.) - - You can similarly create thread-local allocators by storing - mspaces as thread-locals. For example: - static __thread mspace tlms = 0; - void* tlmalloc(size_t bytes) { - if (tlms == 0) tlms = create_mspace(0, 0); - return mspace_malloc(tlms, bytes); - } - void tlfree(void* mem) { mspace_free(tlms, mem); } - - Unless FOOTERS is defined, each mspace is completely independent. - You cannot allocate from one and free to another (although - conformance is only weakly checked, so usage errors are not always - caught). If FOOTERS is defined, then each chunk carries around a tag - indicating its originating mspace, and frees are directed to their - originating spaces. Normally, this requires use of locks. - - ------------------------- Compile-time options --------------------------- - -Be careful in setting #define values for numerical constants of type -size_t. On some systems, literal values are not automatically extended -to size_t precision unless they are explicitly casted. You can also -use the symbolic values MAX_SIZE_T, SIZE_T_ONE, etc below. - -WIN32 default: defined if _WIN32 defined - Defining WIN32 sets up defaults for MS environment and compilers. - Otherwise defaults are for unix. Beware that there seem to be some - cases where this malloc might not be a pure drop-in replacement for - Win32 malloc: Random-looking failures from Win32 GDI API's (eg; - SetDIBits()) may be due to bugs in some video driver implementations - when pixel buffers are malloc()ed, and the region spans more than - one VirtualAlloc()ed region. Because dlmalloc uses a small (64Kb) - default granularity, pixel buffers may straddle virtual allocation - regions more often than when using the Microsoft allocator. You can - avoid this by using VirtualAlloc() and VirtualFree() for all pixel - buffers rather than using malloc(). If this is not possible, - recompile this malloc with a larger DEFAULT_GRANULARITY. Note: - in cases where MSC and gcc (cygwin) are known to differ on WIN32, - conditions use _MSC_VER to distinguish them. - -DLMALLOC_EXPORT default: extern - Defines how public APIs are declared. If you want to export via a - Windows DLL, you might define this as - #define DLMALLOC_EXPORT extern __declspec(dllexport) - If you want a POSIX ELF shared object, you might use - #define DLMALLOC_EXPORT extern __attribute__((visibility("default"))) - -MALLOC_ALIGNMENT default: (size_t)(2 * sizeof(void *)) - Controls the minimum alignment for malloc'ed chunks. It must be a - power of two and at least 8, even on machines for which smaller - alignments would suffice. It may be defined as larger than this - though. Note however that code and data structures are optimized for - the case of 8-byte alignment. - -MSPACES default: 0 (false) - If true, compile in support for independent allocation spaces. - This is only supported if HAVE_MMAP is true. 
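To make the MSPACES description above concrete: a minimal round trip with the documented mspace API, using the companion header the comment points to (malloc-2.8.6.h). This is a sketch assuming the library was built with mspace support, e.g. with -DONLY_MSPACES=1 as the MPI_Generic Makefile in this diff does:

```cpp
#include <cstddef>
#include "malloc-2.8.6.h"  // or hand-declare the mspace prototypes from dl_malloc.c

int main()
{
    mspace ms = create_mspace(0, 0);       // default capacity, no locking
    void*  p  = mspace_malloc(ms, 1024);   // all bookkeeping stays inside ms
    if (p) mspace_free(ms, p);             // must be freed to the same mspace
    destroy_mspace(ms);                    // releases everything ms still holds
    return 0;
}
```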
-
-ONLY_MSPACES default: 0 (false)
- If true, only compile in mspace versions, not regular versions.
-
-USE_LOCKS default: 0 (false)
- Causes each call to each public routine to be surrounded with
- pthread or WIN32 mutex lock/unlock. (If set true, this can be
- overridden on a per-mspace basis for mspace versions.) If set to a
- non-zero value other than 1, locks are used, but their
- implementation is left out, so lock functions must be supplied manually,
- as described below.
-
-USE_SPIN_LOCKS default: 1 iff USE_LOCKS and spin locks available
- If true, uses custom spin locks for locking. This is currently
- supported only for gcc >= 4.1, older gccs on x86 platforms, and recent
- MS compilers. Otherwise, posix locks or win32 critical sections are
- used.
-
-USE_RECURSIVE_LOCKS default: not defined
- If defined nonzero, uses recursive (aka reentrant) locks, otherwise
- uses plain mutexes. This is not required for malloc proper, but may
- be needed for layered allocators such as nedmalloc.
-
-LOCK_AT_FORK default: not defined
- If defined nonzero, performs pthread_atfork upon initialization
- to initialize child lock while holding parent lock. The implementation
- assumes that pthread locks (not custom locks) are being used. In other
- cases, you may need to customize the implementation.
-
-FOOTERS default: 0
- If true, provide extra checking and dispatching by placing
- information in the footers of allocated chunks. This adds
- space and time overhead.
-
-INSECURE default: 0
- If true, omit checks for usage errors and heap space overwrites.
-
-USE_DL_PREFIX default: NOT defined
- Causes compiler to prefix all public routines with the string 'dl'.
- This can be useful when you only want to use this malloc in one part
- of a program, using your regular system malloc elsewhere.
-
-MALLOC_INSPECT_ALL default: NOT defined
- If defined, compiles malloc_inspect_all and mspace_inspect_all, which
- perform traversal of all heap space. Unless access to these
- functions is otherwise restricted, you probably do not want to
- include them in secure implementations.
-
-ABORT default: defined as abort()
- Defines how to abort on failed checks. On most systems, a failed
- check cannot die with an "assert" or even print an informative
- message, because the underlying print routines in turn call malloc,
- which will fail again. Generally, the best policy is to simply call
- abort(). It's not very useful to do more than this because many
- errors due to overwriting will show up as address faults (null, odd
- addresses etc) rather than malloc-triggered checks, so will also
- abort. Also, most compilers know that abort() does not return, so
- can better optimize code conditionally calling it.
-
-PROCEED_ON_ERROR default: defined as 0 (false)
- Controls whether detected bad addresses cause them to be bypassed
- rather than aborting. If set, detected bad arguments to free and
- realloc are ignored. And all bookkeeping information is zeroed out
- upon a detected overwrite of freed heap space, thus losing the
- ability to ever return it from malloc again, but enabling the
- application to proceed. If PROCEED_ON_ERROR is defined, the
- static variable malloc_corruption_error_count is compiled in
- and can be examined to see if errors have occurred. This option
- generates slower code than the default abort policy.
-
-DEBUG default: NOT defined
- The DEBUG setting is mainly intended for people trying to modify
- this code or diagnose problems when porting to new platforms.
-
- However, it may also be able to better isolate user errors than just
- using runtime checks. The assertions in the check routines spell
- out in more detail the assumptions and invariants underlying the
- algorithms. The checking is fairly extensive, and will slow down
- execution noticeably. Calling malloc_stats or mallinfo with DEBUG
- set will attempt to check every non-mmapped allocated and free chunk
- in the course of computing the summaries.
-
-ABORT_ON_ASSERT_FAILURE default: defined as 1 (true)
- Debugging assertion failures can be nearly impossible if your
- version of the assert macro causes malloc to be called, which will
- lead to a cascade of further failures, blowing the runtime stack.
- ABORT_ON_ASSERT_FAILURE causes assertion failures to call abort(),
- which will usually make debugging easier.
-
-MALLOC_FAILURE_ACTION default: sets errno to ENOMEM, or no-op on win32
- The action to take before "return 0" when malloc fails because no
- memory is available.
-
-HAVE_MORECORE default: 1 (true) unless win32 or ONLY_MSPACES
- True if this system supports sbrk or an emulation of it.
-
-MORECORE default: sbrk
- The name of the sbrk-style system routine to call to obtain more
- memory. See below for guidance on writing custom MORECORE
- functions. The type of the argument to sbrk/MORECORE varies across
- systems. It cannot be size_t, because it supports negative
- arguments, so it is normally the signed type of the same width as
- size_t (sometimes declared as "intptr_t"). It doesn't much matter
- though. Internally, we only call it with arguments less than half
- the max value of a size_t, which should work across all reasonable
- possibilities, although sometimes generating compiler warnings.
-
-MORECORE_CONTIGUOUS default: 1 (true) if HAVE_MORECORE
- If true, take advantage of the fact that consecutive calls to MORECORE
- with positive arguments always return contiguous increasing
- addresses. This is true of unix sbrk. It does not hurt too much to
- set it true anyway, since malloc copes with non-contiguities.
- Setting it false when definitely non-contiguous saves the time
- and possibly wasted space it would otherwise take to discover this, though.
-
-MORECORE_CANNOT_TRIM default: NOT defined
- True if MORECORE cannot release space back to the system when given
- negative arguments. This is generally necessary only if you are
- using a hand-crafted MORECORE function that cannot handle negative
- arguments.
-
-NO_SEGMENT_TRAVERSAL default: 0
- If non-zero, suppresses traversals of memory segments
- returned by either MORECORE or CALL_MMAP. This disables
- merging of contiguous segments, and selectively
- releasing them to the OS if unused, but bounds execution times.
-
-HAVE_MMAP default: 1 (true)
- True if this system supports mmap or an emulation of it. If so, and
- HAVE_MORECORE is not true, MMAP is used for all system
- allocation. If set and HAVE_MORECORE is true as well, MMAP is
- primarily used to directly allocate very large blocks. It is also
- used as a backup strategy in cases where MORECORE fails to provide
- space from the system. Note: A single call to MUNMAP is assumed to be
- able to unmap memory that may have been allocated using multiple calls
- to MMAP, so long as they are adjacent.
-
-HAVE_MREMAP default: 1 on linux, else 0
- If true, realloc() uses mremap() to re-allocate large blocks and
- extend or shrink allocation spaces.
-
-MMAP_CLEARS default: 1 except on WINCE.
- True if mmap clears memory so calloc doesn't need to. This is true
- for standard unix mmap using /dev/zero and on WIN32 except for WINCE.
-
-USE_BUILTIN_FFS default: 0 (i.e., not used)
- Causes malloc to use the builtin ffs() function to compute indices.
- Some compilers may recognize and intrinsify ffs to be faster than the
- supplied C version. Also, the case of x86 using gcc is special-cased
- to an asm instruction, so is already as fast as it can be, and so
- this setting has no effect. Similarly for Win32 under recent MS compilers.
- (On most x86s, the asm version is only slightly faster than the C version.)
-
-malloc_getpagesize default: derive from system includes, or 4096.
- The system page size. To the extent possible, this malloc manages
- memory from the system in page-size units. This may be (and
- usually is) a function rather than a constant. This is ignored
- if WIN32, where page size is determined using GetSystemInfo during
- initialization.
-
-USE_DEV_RANDOM default: 0 (i.e., not used)
- Causes malloc to use /dev/random to initialize secure magic seed for
- stamping footers. Otherwise, the current time is used.
-
-NO_MALLINFO default: 0
- If defined, don't compile "mallinfo". This can be a simple way
- of dealing with mismatches between system declarations and
- those in this file.
-
-MALLINFO_FIELD_TYPE default: size_t
- The type of the fields in the mallinfo struct. This was originally
- defined as "int" in SVID etc, but is more usefully defined as
- size_t. The value is used only if HAVE_USR_INCLUDE_MALLOC_H is not set.
-
-NO_MALLOC_STATS default: 0
- If defined, don't compile "malloc_stats". This avoids calls to
- fprintf and bringing in stdio dependencies you might not want.
-
-REALLOC_ZERO_BYTES_FREES default: not defined
- This should be set if a call to realloc with zero bytes should
- be the same as a call to free. Some people think it should. Otherwise,
- since this malloc returns a unique pointer for malloc(0), so does
- realloc(p, 0).
-
-LACKS_UNISTD_H, LACKS_FCNTL_H, LACKS_SYS_PARAM_H, LACKS_SYS_MMAN_H
-LACKS_STRINGS_H, LACKS_STRING_H, LACKS_SYS_TYPES_H, LACKS_ERRNO_H
-LACKS_STDLIB_H LACKS_SCHED_H LACKS_TIME_H default: NOT defined unless on WIN32
- Define these if your system does not have these header files.
- You might need to manually insert some of the declarations they provide.
-
-DEFAULT_GRANULARITY default: page size if MORECORE_CONTIGUOUS,
- system_info.dwAllocationGranularity in WIN32,
- otherwise 64K.
- Also settable using mallopt(M_GRANULARITY, x)
- The unit for allocating and deallocating memory from the system. On
- most systems with contiguous MORECORE, there is no reason to
- make this more than a page. However, systems with MMAP tend to
- either require or encourage larger granularities. You can increase
- this value to prevent system allocation functions from being called so
- often, especially if they are slow. The value must be at least one
- page and must be a power of two. Setting to 0 causes initialization
- to either page size or win32 region size. (Note: In previous
- versions of malloc, the equivalent of this option was called
- "TOP_PAD")
-
-DEFAULT_TRIM_THRESHOLD default: 2MB
- Also settable using mallopt(M_TRIM_THRESHOLD, x)
- The maximum amount of unused top-most memory to keep before
- releasing via malloc_trim in free(). Automatic trimming is mainly
- useful in long-lived programs using contiguous MORECORE. Because
- trimming via sbrk can be slow on some systems, and can sometimes be
- wasteful (in cases where programs immediately afterward allocate
- more large chunks), the value should be high enough so that your
- overall system performance would improve by releasing this much
- memory. As a rough guide, you might set it to a value close to the
- average size of a process (program) running on your system.
- Releasing this much memory would allow such a process to run in
- memory. Generally, it is worth tuning trim thresholds when a
- program undergoes phases where several large chunks are allocated
- and released in ways that can reuse each other's storage, perhaps
- mixed with phases where there are no such chunks at all. The trim
- value must be greater than page size to have any useful effect. To
- disable trimming completely, you can set it to MAX_SIZE_T. Note that the trick
- some people use of mallocing a huge space and then freeing it at
- program startup, in an attempt to reserve system memory, doesn't
- have the intended effect under automatic trimming, since that memory
- will immediately be returned to the system.
-
-DEFAULT_MMAP_THRESHOLD default: 256K
- Also settable using mallopt(M_MMAP_THRESHOLD, x)
- The request size threshold for using MMAP to directly service a
- request. Requests of at least this size that cannot be allocated
- using already-existing space will be serviced via mmap. (If enough
- normal freed space already exists it is used instead.) Using mmap
- segregates relatively large chunks of memory so that they can be
- individually obtained and released from the host system. A request
- serviced through mmap is never reused by any other request (at least
- not directly; the system may just so happen to remap successive
- requests to the same locations). Segregating space in this way has
- the benefits that: Mmapped space can always be individually released
- back to the system, which helps keep the system level memory demands
- of a long-lived program low. Also, mapped memory doesn't become
- `locked' between other chunks, as can happen with normally allocated
- chunks, which means that even trimming via malloc_trim would not
- release them. However, it has the disadvantage that the space
- cannot be reclaimed, consolidated, and then used to service later
- requests, as happens with normal chunks. The advantages of mmap
- nearly always outweigh the disadvantages for "large" chunks, but the
- value of "large" may vary across systems. The default is an
- empirically derived value that works well in most systems. You can
- disable mmap by setting this to MAX_SIZE_T.
-
-MAX_RELEASE_CHECK_RATE default: 4095 unless not HAVE_MMAP
- The number of consolidated frees between checks to release
- unused segments when freeing. When using non-contiguous segments,
- especially with multiple mspaces, checking only for topmost space
- doesn't always suffice to trigger trimming. To compensate for this,
- free() will, with a period of MAX_RELEASE_CHECK_RATE (or the
- current number of segments, if greater) try to release unused
- segments to the OS when freeing chunks that result in
- consolidation. The best value for this parameter is a compromise
- between slowing down frees with relatively costly checks that
- rarely trigger versus holding on to unused memory. To effectively
- disable, set to MAX_SIZE_T. This may lead to a very slight speed
- improvement at the expense of carrying around more memory.
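-
- To make the tuning described above concrete, here is a sketch of a
- startup routine for a program with large transient allocations. The
- values are illustrative assumptions only, not recommendations, and
- this assumes the default (unprefixed) public names:
-
-   void tune_allocator_example(void) {  // call once, before heavy use
-     mallopt(M_TRIM_THRESHOLD, 8*1024*1024); // keep up to 8MB before trimming
-     mallopt(M_MMAP_THRESHOLD, 1024*1024);   // mmap requests of 1MB or more
-     mallopt(M_GRANULARITY,    128*1024);    // grow the heap 128KB at a time
-   }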
-*/
-
-/* Version identifier to allow people to support multiple versions */
-#ifndef DLMALLOC_VERSION
-#define DLMALLOC_VERSION 20806
-#endif /* DLMALLOC_VERSION */
-
-#ifndef DLMALLOC_EXPORT
-#define DLMALLOC_EXPORT extern
-#endif
-
-#ifndef WIN32
-#ifdef _WIN32
-#define WIN32 1
-#endif /* _WIN32 */
-#ifdef _WIN32_WCE
-#define LACKS_FCNTL_H
-#define WIN32 1
-#endif /* _WIN32_WCE */
-#endif /* WIN32 */
-#ifdef WIN32
-#define WIN32_LEAN_AND_MEAN
-#include <windows.h>
-#include <tchar.h>
-#define HAVE_MMAP 1
-#define HAVE_MORECORE 0
-#define LACKS_UNISTD_H
-#define LACKS_SYS_PARAM_H
-#define LACKS_SYS_MMAN_H
-#define LACKS_STRING_H
-#define LACKS_STRINGS_H
-#define LACKS_SYS_TYPES_H
-#define LACKS_ERRNO_H
-#define LACKS_SCHED_H
-#ifndef MALLOC_FAILURE_ACTION
-#define MALLOC_FAILURE_ACTION
-#endif /* MALLOC_FAILURE_ACTION */
-#ifndef MMAP_CLEARS
-#ifdef _WIN32_WCE /* WINCE reportedly does not clear */
-#define MMAP_CLEARS 0
-#else
-#define MMAP_CLEARS 1
-#endif /* _WIN32_WCE */
-#endif /* MMAP_CLEARS */
-#endif /* WIN32 */
-
-#if defined(DARWIN) || defined(_DARWIN)
-/* Mac OSX docs advise not to use sbrk; it seems better to use mmap */
-#ifndef HAVE_MORECORE
-#define HAVE_MORECORE 0
-#define HAVE_MMAP 1
-/* OSX allocators provide 16 byte alignment */
-#ifndef MALLOC_ALIGNMENT
-#define MALLOC_ALIGNMENT ((size_t)16U)
-#endif
-#endif /* HAVE_MORECORE */
-#endif /* DARWIN */
-
-#ifndef LACKS_SYS_TYPES_H
-#include <sys/types.h> /* For size_t */
-#endif /* LACKS_SYS_TYPES_H */
-
-/* The maximum possible size_t value has all bits set */
-#define MAX_SIZE_T (~(size_t)0)
-
-#ifndef USE_LOCKS /* ensure true if spin or recursive locks set */
-#define USE_LOCKS ((defined(USE_SPIN_LOCKS) && USE_SPIN_LOCKS != 0) || \
- (defined(USE_RECURSIVE_LOCKS) && USE_RECURSIVE_LOCKS != 0))
-#endif /* USE_LOCKS */
-
-#if USE_LOCKS /* Spin locks for gcc >= 4.1, older gcc on x86, MSC >= 1310 */
-#if ((defined(__GNUC__) && \
- ((__GNUC__ > 4 || (__GNUC__ == 4 && __GNUC_MINOR__ >= 1)) || \
- defined(__i386__) || defined(__x86_64__))) || \
- (defined(_MSC_VER) && _MSC_VER>=1310))
-#ifndef USE_SPIN_LOCKS
-#define USE_SPIN_LOCKS 1
-#endif /* USE_SPIN_LOCKS */
-#elif USE_SPIN_LOCKS
-#error "USE_SPIN_LOCKS defined without implementation"
-#endif /* ... locks available...
*/ -#elif !defined(USE_SPIN_LOCKS) -#define USE_SPIN_LOCKS 0 -#endif /* USE_LOCKS */ - -#ifndef ONLY_MSPACES -#define ONLY_MSPACES 0 -#endif /* ONLY_MSPACES */ -#ifndef MSPACES -#if ONLY_MSPACES -#define MSPACES 1 -#else /* ONLY_MSPACES */ -#define MSPACES 0 -#endif /* ONLY_MSPACES */ -#endif /* MSPACES */ -#ifndef MALLOC_ALIGNMENT -#define MALLOC_ALIGNMENT ((size_t)(2 * sizeof(void *))) -#endif /* MALLOC_ALIGNMENT */ -#ifndef FOOTERS -#define FOOTERS 0 -#endif /* FOOTERS */ -#ifndef ABORT -#define ABORT abort() -#endif /* ABORT */ -#ifndef ABORT_ON_ASSERT_FAILURE -#define ABORT_ON_ASSERT_FAILURE 1 -#endif /* ABORT_ON_ASSERT_FAILURE */ -#ifndef PROCEED_ON_ERROR -#define PROCEED_ON_ERROR 0 -#endif /* PROCEED_ON_ERROR */ - -#ifndef INSECURE -#define INSECURE 0 -#endif /* INSECURE */ -#ifndef MALLOC_INSPECT_ALL -#define MALLOC_INSPECT_ALL 0 -#endif /* MALLOC_INSPECT_ALL */ -#ifndef HAVE_MMAP -#define HAVE_MMAP 1 -#endif /* HAVE_MMAP */ -#ifndef MMAP_CLEARS -#define MMAP_CLEARS 1 -#endif /* MMAP_CLEARS */ -#ifndef HAVE_MREMAP -#ifdef linux -#define HAVE_MREMAP 1 -#define _GNU_SOURCE /* Turns on mremap() definition */ -#else /* linux */ -#define HAVE_MREMAP 0 -#endif /* linux */ -#endif /* HAVE_MREMAP */ -#ifndef MALLOC_FAILURE_ACTION -#define MALLOC_FAILURE_ACTION errno = ENOMEM; -#endif /* MALLOC_FAILURE_ACTION */ -#ifndef HAVE_MORECORE -#if ONLY_MSPACES -#define HAVE_MORECORE 0 -#else /* ONLY_MSPACES */ -#define HAVE_MORECORE 1 -#endif /* ONLY_MSPACES */ -#endif /* HAVE_MORECORE */ -#if !HAVE_MORECORE -#define MORECORE_CONTIGUOUS 0 -#else /* !HAVE_MORECORE */ -#define MORECORE_DEFAULT sbrk -#ifndef MORECORE_CONTIGUOUS -#define MORECORE_CONTIGUOUS 1 -#endif /* MORECORE_CONTIGUOUS */ -#endif /* HAVE_MORECORE */ -#ifndef DEFAULT_GRANULARITY -#if (MORECORE_CONTIGUOUS || defined(WIN32)) -#define DEFAULT_GRANULARITY (0) /* 0 means to compute in init_mparams */ -#else /* MORECORE_CONTIGUOUS */ -#define DEFAULT_GRANULARITY ((size_t)64U * (size_t)1024U) -#endif /* MORECORE_CONTIGUOUS */ -#endif /* DEFAULT_GRANULARITY */ -#ifndef DEFAULT_TRIM_THRESHOLD -#ifndef MORECORE_CANNOT_TRIM -#define DEFAULT_TRIM_THRESHOLD ((size_t)2U * (size_t)1024U * (size_t)1024U) -#else /* MORECORE_CANNOT_TRIM */ -#define DEFAULT_TRIM_THRESHOLD MAX_SIZE_T -#endif /* MORECORE_CANNOT_TRIM */ -#endif /* DEFAULT_TRIM_THRESHOLD */ -#ifndef DEFAULT_MMAP_THRESHOLD -#if HAVE_MMAP -#define DEFAULT_MMAP_THRESHOLD ((size_t)256U * (size_t)1024U) -#else /* HAVE_MMAP */ -#define DEFAULT_MMAP_THRESHOLD MAX_SIZE_T -#endif /* HAVE_MMAP */ -#endif /* DEFAULT_MMAP_THRESHOLD */ -#ifndef MAX_RELEASE_CHECK_RATE -#if HAVE_MMAP -#define MAX_RELEASE_CHECK_RATE 4095 -#else -#define MAX_RELEASE_CHECK_RATE MAX_SIZE_T -#endif /* HAVE_MMAP */ -#endif /* MAX_RELEASE_CHECK_RATE */ -#ifndef USE_BUILTIN_FFS -#define USE_BUILTIN_FFS 0 -#endif /* USE_BUILTIN_FFS */ -#ifndef USE_DEV_RANDOM -#define USE_DEV_RANDOM 0 -#endif /* USE_DEV_RANDOM */ -#ifndef NO_MALLINFO -#define NO_MALLINFO 0 -#endif /* NO_MALLINFO */ -#ifndef MALLINFO_FIELD_TYPE -#define MALLINFO_FIELD_TYPE size_t -#endif /* MALLINFO_FIELD_TYPE */ -#ifndef NO_MALLOC_STATS -#define NO_MALLOC_STATS 0 -#endif /* NO_MALLOC_STATS */ -#ifndef NO_SEGMENT_TRAVERSAL -#define NO_SEGMENT_TRAVERSAL 0 -#endif /* NO_SEGMENT_TRAVERSAL */ - -/* - mallopt tuning options. SVID/XPG defines four standard parameter - numbers for mallopt, normally defined in malloc.h. None of these - are used in this malloc, so setting them has no effect. But this - malloc does support the following options. 
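-
- For example, a long-lived program that prefers to retain memory
- rather than trim can disable trimming at startup (a sketch; as
- documented below, mallopt specially treats an argument of -1 as the
- maximum size_t value):
-
-   mallopt(M_TRIM_THRESHOLD, -1); // never release topmost space to the system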
-*/
-
-#define M_TRIM_THRESHOLD (-1)
-#define M_GRANULARITY (-2)
-#define M_MMAP_THRESHOLD (-3)
-
-/* ------------------------ Mallinfo declarations ------------------------ */
-
-#if !NO_MALLINFO
-/*
- This version of malloc supports the standard SVID/XPG mallinfo
- routine that returns a struct containing usage properties and
- statistics. It should work on any system that has a
- /usr/include/malloc.h defining struct mallinfo. The main
- declaration needed is the mallinfo struct that is returned (by-copy)
- by mallinfo(). The mallinfo struct contains a bunch of fields that
- are not even meaningful in this version of malloc. These fields
- are instead filled by mallinfo() with other numbers that might be of
- interest.
-
- HAVE_USR_INCLUDE_MALLOC_H should be set if you have a
- /usr/include/malloc.h file that includes a declaration of struct
- mallinfo. If so, it is included; else a compliant version is
- declared below. These must be precisely the same for mallinfo() to
- work. The original SVID version of this struct, defined on most
- systems with mallinfo, declares all fields as ints. But some others
- define them as unsigned long. If your system defines the fields using a
- type of different width than listed here, you MUST #include your
- system version and #define HAVE_USR_INCLUDE_MALLOC_H.
-*/
-
-/* #define HAVE_USR_INCLUDE_MALLOC_H */
-
-#ifdef HAVE_USR_INCLUDE_MALLOC_H
-#include "/usr/include/malloc.h"
-#else /* HAVE_USR_INCLUDE_MALLOC_H */
-#ifndef STRUCT_MALLINFO_DECLARED
-/* HP-UX (and others?) redefines mallinfo unless _STRUCT_MALLINFO is defined */
-#define _STRUCT_MALLINFO
-#define STRUCT_MALLINFO_DECLARED 1
-struct mallinfo {
-  MALLINFO_FIELD_TYPE arena;    /* non-mmapped space allocated from system */
-  MALLINFO_FIELD_TYPE ordblks;  /* number of free chunks */
-  MALLINFO_FIELD_TYPE smblks;   /* always 0 */
-  MALLINFO_FIELD_TYPE hblks;    /* always 0 */
-  MALLINFO_FIELD_TYPE hblkhd;   /* space in mmapped regions */
-  MALLINFO_FIELD_TYPE usmblks;  /* maximum total allocated space */
-  MALLINFO_FIELD_TYPE fsmblks;  /* always 0 */
-  MALLINFO_FIELD_TYPE uordblks; /* total allocated space */
-  MALLINFO_FIELD_TYPE fordblks; /* total free space */
-  MALLINFO_FIELD_TYPE keepcost; /* releasable (via malloc_trim) space */
-};
-#endif /* STRUCT_MALLINFO_DECLARED */
-#endif /* HAVE_USR_INCLUDE_MALLOC_H */
-#endif /* NO_MALLINFO */
-
-/*
- Try to persuade compilers to inline. The most critical functions for
- inlining are defined as macros, so these aren't used for them.
-*/
-
-#ifndef FORCEINLINE
- #if defined(__GNUC__)
- #define FORCEINLINE __inline __attribute__ ((always_inline))
- #elif defined(_MSC_VER)
- #define FORCEINLINE __forceinline
- #endif
-#endif
-#ifndef NOINLINE
- #if defined(__GNUC__)
- #define NOINLINE __attribute__ ((noinline))
- #elif defined(_MSC_VER)
- #define NOINLINE __declspec(noinline)
- #else
- #define NOINLINE
- #endif
-#endif
-
-#ifdef __cplusplus
-extern "C" {
-#ifndef FORCEINLINE
- #define FORCEINLINE inline
-#endif
-#endif /* __cplusplus */
-#ifndef FORCEINLINE
- #define FORCEINLINE
-#endif
-
-#if !ONLY_MSPACES
-
-/* ------------------- Declarations of public routines ------------------- */
-
-#ifndef USE_DL_PREFIX
-#define dlcalloc calloc
-#define dlfree free
-#define dlmalloc malloc
-#define dlmemalign memalign
-#define dlposix_memalign posix_memalign
-#define dlrealloc realloc
-#define dlrealloc_in_place realloc_in_place
-#define dlvalloc valloc
-#define dlpvalloc pvalloc
-#define dlmallinfo mallinfo
-#define dlmallopt mallopt
-#define dlmalloc_trim malloc_trim
-#define dlmalloc_stats malloc_stats
-#define dlmalloc_usable_size malloc_usable_size
-#define dlmalloc_footprint malloc_footprint
-#define dlmalloc_max_footprint malloc_max_footprint
-#define dlmalloc_footprint_limit malloc_footprint_limit
-#define dlmalloc_set_footprint_limit malloc_set_footprint_limit
-#define dlmalloc_inspect_all malloc_inspect_all
-#define dlindependent_calloc independent_calloc
-#define dlindependent_comalloc independent_comalloc
-#define dlbulk_free bulk_free
-#endif /* USE_DL_PREFIX */
-
-/*
- malloc(size_t n)
- Returns a pointer to a newly allocated chunk of at least n bytes, or
- null if no space is available, in which case errno is set to ENOMEM
- on ANSI C systems.
-
- If n is zero, malloc returns a minimum-sized chunk. (The minimum
- size is 16 bytes on most 32bit systems, and 32 bytes on 64bit
- systems.) Note that size_t is an unsigned type, so calls with
- arguments that would be negative if signed are interpreted as
- requests for huge amounts of space, which will often fail. The
- maximum supported value of n differs across systems, but is in all
- cases less than the maximum representable value of a size_t.
-*/
-DLMALLOC_EXPORT void* dlmalloc(size_t);
-
-/*
- free(void* p)
- Releases the chunk of memory pointed to by p, that had been previously
- allocated using malloc or a related routine such as realloc.
- It has no effect if p is null. If p was not malloced or already
- freed, free(p) will by default cause the current program to abort.
-*/
-DLMALLOC_EXPORT void dlfree(void*);
-
-/*
- calloc(size_t n_elements, size_t element_size);
- Returns a pointer to n_elements * element_size bytes, with all locations
- set to zero.
-*/
-DLMALLOC_EXPORT void* dlcalloc(size_t, size_t);
-
-/*
- realloc(void* p, size_t n)
- Returns a pointer to a chunk of size n that contains the same data
- as does chunk p up to the minimum of (n, p's size) bytes, or null
- if no space is available.
-
- The returned pointer may or may not be the same as p. The algorithm
- prefers extending p in most cases when possible, otherwise it
- employs the equivalent of a malloc-copy-free sequence.
-
- If p is null, realloc is equivalent to malloc.
-
- If space is not available, realloc returns null, errno is set (if on
- ANSI) and p is NOT freed.
-
- If n is for fewer bytes than already held by p, the newly unused
- space is lopped off and freed if possible. realloc with a size
- argument of zero (re)allocates a minimum-sized chunk.
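-
- For example, a sketch of the failure-handling contract described
- above:
-
-   void* p = malloc(100);
-   void* q = realloc(p, 200);  // may move; if so, do not use the old p
-   if (q == 0)
-     free(p);                  // on failure, p was not freed and is still valid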
-
- The old unix realloc convention of allowing the last-free'd chunk
- to be used as an argument to realloc is not supported.
-*/
-DLMALLOC_EXPORT void* dlrealloc(void*, size_t);
-
-/*
- realloc_in_place(void* p, size_t n)
- Resizes the space allocated for p to size n, only if this can be
- done without moving p (i.e., only if there is adjacent space
- available if n is greater than p's current allocated size, or n is
- less than or equal to p's size). This may be used instead of plain
- realloc if an alternative allocation strategy is needed upon failure
- to expand space; for example, reallocation of a buffer that must be
- memory-aligned or cleared. You can use realloc_in_place to trigger
- these alternatives only when needed.
-
- Returns p if successful; otherwise null.
-*/
-DLMALLOC_EXPORT void* dlrealloc_in_place(void*, size_t);
-
-/*
- memalign(size_t alignment, size_t n);
- Returns a pointer to a newly allocated chunk of n bytes, aligned
- in accord with the alignment argument.
-
- The alignment argument should be a power of two. If the argument is
- not a power of two, the nearest greater power is used.
- 8-byte alignment is guaranteed by normal malloc calls, so don't
- bother calling memalign with an argument of 8 or less.
-
- Overreliance on memalign is a sure way to fragment space.
-*/
-DLMALLOC_EXPORT void* dlmemalign(size_t, size_t);
-
-/*
- int posix_memalign(void** pp, size_t alignment, size_t n);
- Allocates a chunk of n bytes, aligned in accord with the alignment
- argument. Differs from memalign only in that it (1) assigns the
- allocated memory to *pp rather than returning it, (2) fails and
- returns EINVAL if the alignment is not a power of two, (3) fails and
- returns ENOMEM if memory cannot be allocated.
-*/
-DLMALLOC_EXPORT int dlposix_memalign(void**, size_t, size_t);
-
-/*
- valloc(size_t n);
- Equivalent to memalign(pagesize, n), where pagesize is the page
- size of the system. If the pagesize is unknown, 4096 is used.
-*/
-DLMALLOC_EXPORT void* dlvalloc(size_t);
-
-/*
- mallopt(int parameter_number, int parameter_value)
- Sets tunable parameters. The format is to provide a
- (parameter-number, parameter-value) pair. mallopt then sets the
- corresponding parameter to the argument value if it can (i.e., so
- long as the value is meaningful), and returns 1 if successful else
- 0. To work around the fact that mallopt is specified to use int,
- not size_t parameters, the value -1 is specially treated as the
- maximum unsigned size_t value.
-
- SVID/XPG/ANSI defines four standard param numbers for mallopt,
- normally defined in malloc.h. None of these are used in this malloc,
- so setting them has no effect. But this malloc also supports other
- options in mallopt. See below for details. Briefly, supported
- parameters are as follows (listed defaults are for "typical"
- configurations).
-
- Symbol            param #  default       allowed param values
- M_TRIM_THRESHOLD     -1    2*1024*1024   any (-1 disables)
- M_GRANULARITY        -2    page size     any power of 2 >= page size
- M_MMAP_THRESHOLD     -3    256*1024      any (or 0 if no MMAP support)
-*/
-DLMALLOC_EXPORT int dlmallopt(int, int);
-
-/*
- malloc_footprint();
- Returns the number of bytes obtained from the system. The total
- number of bytes allocated by malloc, realloc etc., is less than this
- value. Unlike mallinfo, this function returns only a precomputed
- result, so can be called frequently to monitor memory consumption.
- Even if locks are otherwise defined, this function does not use them,
- so results might not be up to date.
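-
- For example, a simple monitoring hook might look like this (a
- sketch; report_bytes is a hypothetical logging helper):
-
-   void report_heap_size(void) {
-     report_bytes("heap footprint", malloc_footprint());
-   }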
-*/
-DLMALLOC_EXPORT size_t dlmalloc_footprint(void);
-
-/*
- malloc_max_footprint();
- Returns the maximum number of bytes obtained from the system. This
- value will be greater than current footprint if deallocated space
- has been reclaimed by the system. The peak number of bytes allocated
- by malloc, realloc etc., is less than this value. Unlike mallinfo,
- this function returns only a precomputed result, so can be called
- frequently to monitor memory consumption. Even if locks are
- otherwise defined, this function does not use them, so results might
- not be up to date.
-*/
-DLMALLOC_EXPORT size_t dlmalloc_max_footprint(void);
-
-/*
- malloc_footprint_limit();
- Returns the number of bytes that the heap is allowed to obtain from
- the system, returning the last value returned by
- malloc_set_footprint_limit, or the maximum size_t value if
- never set. The returned value reflects a permission. There is no
- guarantee that this number of bytes can actually be obtained from
- the system.
-*/
-DLMALLOC_EXPORT size_t dlmalloc_footprint_limit();
-
-/*
- malloc_set_footprint_limit();
- Sets the maximum number of bytes to obtain from the system, causing
- failure returns from malloc and related functions upon attempts to
- exceed this value. The argument value may be subject to page
- rounding to an enforceable limit; this actual value is returned.
- Using an argument of the maximum possible size_t effectively
- disables checks. If the argument is less than or equal to the
- current malloc_footprint, then all future allocations that require
- additional system memory will fail. However, invocation cannot
- retroactively deallocate existing used memory.
-*/
-DLMALLOC_EXPORT size_t dlmalloc_set_footprint_limit(size_t bytes);
-
-#if MALLOC_INSPECT_ALL
-/*
- malloc_inspect_all(void(*handler)(void *start,
-                                   void *end,
-                                   size_t used_bytes,
-                                   void* callback_arg),
-                    void* arg);
- Traverses the heap and calls the given handler for each managed
- region, skipping all bytes that are (or may be) used for bookkeeping
- purposes. Traversal does not include chunks that have been
- directly memory mapped. Each reported region begins at the start
- address, and continues up to but not including the end address. The
- first used_bytes of the region contain allocated data. If
- used_bytes is zero, the region is unallocated. The handler is
- invoked with the given callback argument. If locks are defined, they
- are held during the entire traversal. It is a bad idea to invoke
- other malloc functions from within the handler.
-
- For example, to count the number of in-use chunks with size greater
- than 1000, you could write:
-   static int count = 0;
-   void count_chunks(void* start, void* end, size_t used, void* arg) {
-     if (used >= 1000) ++count;
-   }
- then:
-   malloc_inspect_all(count_chunks, NULL);
-
- malloc_inspect_all is compiled only if MALLOC_INSPECT_ALL is defined.
-*/
-DLMALLOC_EXPORT void dlmalloc_inspect_all(void(*handler)(void*, void *, size_t, void*),
-                                          void* arg);
-
-#endif /* MALLOC_INSPECT_ALL */
-
-#if !NO_MALLINFO
-/*
- mallinfo()
- Returns (by copy) a struct containing various summary statistics:
-
- arena:     current total non-mmapped bytes allocated from system
- ordblks:   the number of free chunks
- smblks:    always zero.
- hblks:     current number of mmapped regions
- hblkhd:    total bytes held in mmapped regions
- usmblks:   the maximum total allocated space. This will be greater
-            than current total if trimming has occurred.
- fsmblks:   always zero
- uordblks:  current total allocated space (normal or mmapped)
- fordblks:  total free space
- keepcost:  the maximum number of bytes that could ideally be released
-            back to system via malloc_trim. ("ideally" means that
-            it ignores page restrictions etc.)
-
- Because these fields are ints, but internal bookkeeping may
- be kept as longs, the reported values may wrap around zero and
- thus be inaccurate.
-*/
-DLMALLOC_EXPORT struct mallinfo dlmallinfo(void);
-#endif /* NO_MALLINFO */
-
-/*
- independent_calloc(size_t n_elements, size_t element_size, void* chunks[]);
-
- independent_calloc is similar to calloc, but instead of returning a
- single cleared space, it returns an array of pointers to n_elements
- independent elements that can hold contents of size elem_size, each
- of which starts out cleared, and can be independently freed,
- realloc'ed etc. The elements are guaranteed to be adjacently
- allocated (this is not guaranteed to occur with multiple callocs or
- mallocs), which may also improve cache locality in some
- applications.
-
- The "chunks" argument is optional (i.e., may be null, which is
- probably the most typical usage). If it is null, the returned array
- is itself dynamically allocated and should also be freed when it is
- no longer needed. Otherwise, the chunks array must be of at least
- n_elements in length. It is filled in with the pointers to the
- chunks.
-
- In either case, independent_calloc returns this pointer array, or
- null if the allocation failed. If n_elements is zero and "chunks"
- is null, it returns a chunk representing an array with zero elements
- (which should be freed if not wanted).
-
- Each element must be freed when it is no longer needed. This can be
- done all at once using bulk_free.
-
- independent_calloc simplifies and speeds up implementations of many
- kinds of pools. It may also be useful when constructing large data
- structures that initially have a fixed number of fixed-sized nodes,
- but the number is not known at compile time, and some of the nodes
- may later need to be freed. For example:
-
-   struct Node { int item; struct Node* next; };
-
-   struct Node* build_list() {
-     struct Node** pool;
-     int n = read_number_of_nodes_needed();
-     int i;
-     if (n <= 0) return 0;
-     pool = (struct Node**)independent_calloc(n, sizeof(struct Node), 0);
-     if (pool == 0) die();
-     // organize into a linked list...
-     struct Node* first = pool[0];
-     for (i = 0; i < n-1; ++i)
-       pool[i]->next = pool[i+1];
-     free(pool); // Can now free the array (or not, if it is needed later)
-     return first;
-   }
-*/
-DLMALLOC_EXPORT void** dlindependent_calloc(size_t, size_t, void**);
-
-/*
- independent_comalloc(size_t n_elements, size_t sizes[], void* chunks[]);
-
- independent_comalloc allocates, all at once, a set of n_elements
- chunks with sizes indicated in the "sizes" array. It returns
- an array of pointers to these elements, each of which can be
- independently freed, realloc'ed etc. The elements are guaranteed to
- be adjacently allocated (this is not guaranteed to occur with
- multiple callocs or mallocs), which may also improve cache locality
- in some applications.
-
- The "chunks" argument is optional (i.e., may be null). If it is null
- the returned array is itself dynamically allocated and should also
- be freed when it is no longer needed. Otherwise, the chunks array
- must be of at least n_elements in length. It is filled in with the
- pointers to the chunks.
-
- In either case, independent_comalloc returns this pointer array, or
- null if the allocation failed. If n_elements is zero and chunks is
- null, it returns a chunk representing an array with zero elements
- (which should be freed if not wanted).
-
- Each element must be freed when it is no longer needed. This can be
- done all at once using bulk_free.
-
- independent_comalloc differs from independent_calloc in that each
- element may have a different size, and also that it does not
- automatically clear elements.
-
- independent_comalloc can be used to speed up allocation in cases
- where several structs or objects must always be allocated at the
- same time. For example:
-
-   struct Head { ... };
-   struct Foot { ... };
-
-   void send_message(char* msg) {
-     int msglen = strlen(msg);
-     size_t sizes[3] = { sizeof(struct Head), msglen, sizeof(struct Foot) };
-     void* chunks[3];
-     if (independent_comalloc(3, sizes, chunks) == 0)
-       die();
-     struct Head* head = (struct Head*)(chunks[0]);
-     char* body = (char*)(chunks[1]);
-     struct Foot* foot = (struct Foot*)(chunks[2]);
-     // ...
-   }
-
- In general though, independent_comalloc is worth using only for
- larger values of n_elements. For small values, you probably won't
- detect enough difference from series of malloc calls to bother.
-
- Overuse of independent_comalloc can increase overall memory usage,
- since it cannot reuse existing noncontiguous small chunks that
- might be available for some of the elements.
-*/
-DLMALLOC_EXPORT void** dlindependent_comalloc(size_t, size_t*, void**);
-
-/*
- bulk_free(void* array[], size_t n_elements)
- Frees and clears (sets to null) each non-null pointer in the given
- array. This is likely to be faster than freeing them one-by-one.
- If footers are used, pointers that have been allocated in different
- mspaces are not freed or cleared, and the count of all such pointers
- is returned. For large arrays of pointers with poor locality, it
- may be worthwhile to sort this array before calling bulk_free.
-*/
-DLMALLOC_EXPORT size_t dlbulk_free(void**, size_t n_elements);
-
-/*
- pvalloc(size_t n);
- Equivalent to valloc(minimum-page-that-holds(n)), that is,
- round up n to nearest pagesize.
- */
-DLMALLOC_EXPORT void* dlpvalloc(size_t);
-
-/*
- malloc_trim(size_t pad);
-
- If possible, gives memory back to the system (via negative arguments
- to sbrk) if there is unused memory at the `high' end of the malloc
- pool or in unused MMAP segments. You can call this after freeing
- large blocks of memory to potentially reduce the system-level memory
- requirements of a program. However, it cannot guarantee to reduce
- memory. Under some allocation patterns, some large free blocks of
- memory will be locked between two used chunks, so they cannot be
- given back to the system.
-
- The `pad' argument to malloc_trim represents the amount of free
- trailing space to leave untrimmed. If this argument is zero, only
- the minimum amount of memory to maintain internal data structures
- will be left. Non-zero arguments can be supplied to maintain enough
- trailing space to service future expected allocations without having
- to re-obtain memory from the system.
-
- Malloc_trim returns 1 if it actually released any memory, else 0.
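-
- For example, after releasing a large working set (a sketch; the
- 64KB pad is an illustrative choice, not a recommendation):
-
-   int released = malloc_trim(64 * 1024); // leave 64KB of trailing slack
-   // released == 1 only if memory was actually returned to the system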
-*/ -DLMALLOC_EXPORT int dlmalloc_trim(size_t); - -/* - malloc_stats(); - Prints on stderr the amount of space obtained from the system (both - via sbrk and mmap), the maximum amount (which may be more than - current if malloc_trim and/or munmap got called), and the current - number of bytes allocated via malloc (or realloc, etc) but not yet - freed. Note that this is the number of bytes allocated, not the - number requested. It will be larger than the number requested - because of alignment and bookkeeping overhead. Because it includes - alignment wastage as being in use, this figure may be greater than - zero even when no user-level chunks are allocated. - - The reported current and maximum system memory can be inaccurate if - a program makes other calls to system memory allocation functions - (normally sbrk) outside of malloc. - - malloc_stats prints only the most commonly interesting statistics. - More information can be obtained by calling mallinfo. -*/ -DLMALLOC_EXPORT void dlmalloc_stats(void); - -/* - malloc_usable_size(void* p); - - Returns the number of bytes you can actually use in - an allocated chunk, which may be more than you requested (although - often not) due to alignment and minimum size constraints. - You can use this many bytes without worrying about - overwriting other allocated objects. This is not a particularly great - programming practice. malloc_usable_size can be more useful in - debugging and assertions, for example: - - p = malloc(n); - assert(malloc_usable_size(p) >= 256); -*/ -size_t dlmalloc_usable_size(void*); - -#endif /* ONLY_MSPACES */ - -#if MSPACES - -/* - mspace is an opaque type representing an independent - region of space that supports mspace_malloc, etc. -*/ -typedef void* mspace; - -/* - create_mspace creates and returns a new independent space with the - given initial capacity, or, if 0, the default granularity size. It - returns null if there is no system memory available to create the - space. If argument locked is non-zero, the space uses a separate - lock to control access. The capacity of the space will grow - dynamically as needed to service mspace_malloc requests. You can - control the sizes of incremental increases of this space by - compiling with a different DEFAULT_GRANULARITY or dynamically - setting with mallopt(M_GRANULARITY, value). -*/ -DLMALLOC_EXPORT mspace create_mspace(size_t capacity, int locked); - -/* - destroy_mspace destroys the given space, and attempts to return all - of its memory back to the system, returning the total number of - bytes freed. After destruction, the results of access to all memory - used by the space become undefined. -*/ -DLMALLOC_EXPORT size_t destroy_mspace(mspace msp); - -/* - create_mspace_with_base uses the memory supplied as the initial base - of a new mspace. Part (less than 128*sizeof(size_t) bytes) of this - space is used for bookkeeping, so the capacity must be at least this - large. (Otherwise 0 is returned.) When this initial space is - exhausted, additional memory will be obtained from the system. - Destroying this space will deallocate all additionally allocated - space (if possible) but not the initial base. -*/ -DLMALLOC_EXPORT mspace create_mspace_with_base(void* base, size_t capacity, int locked); -DLMALLOC_EXPORT mspace create_device_mspace_with_base(void* base, size_t capacity, int locked); - -/* - mspace_track_large_chunks controls whether requests for large chunks - are allocated in their own untracked mmapped regions, separate from - others in this mspace. 
By default large chunks are not tracked,
- which reduces fragmentation. However, such chunks are not
- necessarily released to the system upon destroy_mspace. Enabling
- tracking by setting to true may increase fragmentation, but avoids
- leakage when relying on destroy_mspace to release all memory
- allocated using this space. The function returns the previous
- setting.
-*/
-DLMALLOC_EXPORT int mspace_track_large_chunks(mspace msp, int enable);
-
-
-/*
- mspace_malloc behaves as malloc, but operates within
- the given space.
-*/
-DLMALLOC_EXPORT void* mspace_malloc(mspace msp, size_t bytes);
-
-/*
- mspace_free behaves as free, but operates within
- the given space.
-
- If compiled with FOOTERS==1, mspace_free is not actually needed.
- free may be called instead of mspace_free because freed chunks from
- any space are handled by their originating spaces.
-*/
-DLMALLOC_EXPORT void mspace_free(mspace msp, void* mem);
-
-/*
- mspace_realloc behaves as realloc, but operates within
- the given space.
-
- If compiled with FOOTERS==1, mspace_realloc is not actually
- needed. realloc may be called instead of mspace_realloc because
- realloced chunks from any space are handled by their originating
- spaces.
-*/
-DLMALLOC_EXPORT void* mspace_realloc(mspace msp, void* mem, size_t newsize);
-
-/*
- mspace_calloc behaves as calloc, but operates within
- the given space.
-*/
-DLMALLOC_EXPORT void* mspace_calloc(mspace msp, size_t n_elements, size_t elem_size);
-
-/*
- mspace_memalign behaves as memalign, but operates within
- the given space.
-*/
-DLMALLOC_EXPORT void* mspace_memalign(mspace msp, size_t alignment, size_t bytes);
-
-/*
- mspace_independent_calloc behaves as independent_calloc, but
- operates within the given space.
-*/
-DLMALLOC_EXPORT void** mspace_independent_calloc(mspace msp, size_t n_elements,
-                                                 size_t elem_size, void* chunks[]);
-
-/*
- mspace_independent_comalloc behaves as independent_comalloc, but
- operates within the given space.
-*/
-DLMALLOC_EXPORT void** mspace_independent_comalloc(mspace msp, size_t n_elements,
-                                                   size_t sizes[], void* chunks[]);
-
-/*
- mspace_footprint() returns the number of bytes obtained from the
- system for this space.
-*/
-DLMALLOC_EXPORT size_t mspace_footprint(mspace msp);
-
-/*
- mspace_max_footprint() returns the peak number of bytes obtained from the
- system for this space.
-*/
-DLMALLOC_EXPORT size_t mspace_max_footprint(mspace msp);
-
-
-#if !NO_MALLINFO
-/*
- mspace_mallinfo behaves as mallinfo, but reports properties of
- the given space.
-*/
-DLMALLOC_EXPORT struct mallinfo mspace_mallinfo(mspace msp);
-#endif /* NO_MALLINFO */
-
-/*
- mspace_usable_size(const void* p) behaves the same as malloc_usable_size.
-*/
-DLMALLOC_EXPORT size_t mspace_usable_size(const void* mem);
-
-/*
- mspace_malloc_stats behaves as malloc_stats, but reports
- properties of the given space.
-*/
-DLMALLOC_EXPORT void mspace_malloc_stats(mspace msp);
-
-/*
- mspace_trim behaves as malloc_trim, but
- operates within the given space.
-*/
-DLMALLOC_EXPORT int mspace_trim(mspace msp, size_t pad);
-
-/*
- An alias for mallopt.
-*/
-DLMALLOC_EXPORT int mspace_mallopt(int, int);
-
-#endif /* MSPACES */
-
-#ifdef __cplusplus
-} /* end of extern "C" */
-#endif /* __cplusplus */
-
-/*
- ========================================================================
- To make a fully customizable malloc.h header file, cut everything
- above this line, put into file malloc.h, edit to suit, and #include it
- on the next line, as well as in programs that use this malloc.
- ========================================================================
-*/
-
-/* #include "malloc.h" */
-
-/*------------------------------ internal #includes ---------------------- */
-
-#ifdef _MSC_VER
-#pragma warning( disable : 4146 ) /* no "unsigned" warnings */
-#endif /* _MSC_VER */
-#if !NO_MALLOC_STATS
-#include <stdio.h> /* for printing in malloc_stats */
-#endif /* NO_MALLOC_STATS */
-#ifndef LACKS_ERRNO_H
-#include <errno.h> /* for MALLOC_FAILURE_ACTION */
-#endif /* LACKS_ERRNO_H */
-#ifdef DEBUG
-#if ABORT_ON_ASSERT_FAILURE
-#undef assert
-#define assert(x) if(!(x)) ABORT
-#else /* ABORT_ON_ASSERT_FAILURE */
-#include <assert.h>
-#endif /* ABORT_ON_ASSERT_FAILURE */
-#else /* DEBUG */
-#ifndef assert
-#define assert(x)
-#endif
-#define DEBUG 0
-#endif /* DEBUG */
-#if !defined(WIN32) && !defined(LACKS_TIME_H)
-#include <time.h> /* for magic initialization */
-#endif /* WIN32 */
-#ifndef LACKS_STDLIB_H
-#include <stdlib.h> /* for abort() */
-#endif /* LACKS_STDLIB_H */
-#ifndef LACKS_STRING_H
-#include <string.h> /* for memset etc */
-#endif /* LACKS_STRING_H */
-#if USE_BUILTIN_FFS
-#ifndef LACKS_STRINGS_H
-#include <strings.h> /* for ffs */
-#endif /* LACKS_STRINGS_H */
-#endif /* USE_BUILTIN_FFS */
-#if HAVE_MMAP
-#ifndef LACKS_SYS_MMAN_H
-/* On some versions of linux, mremap decl in mman.h needs __USE_GNU set */
-#if (defined(linux) && !defined(__USE_GNU))
-#define __USE_GNU 1
-#include <sys/mman.h> /* for mmap */
-#undef __USE_GNU
-#else
-#include <sys/mman.h> /* for mmap */
-#endif /* linux */
-#endif /* LACKS_SYS_MMAN_H */
-#ifndef LACKS_FCNTL_H
-#include <fcntl.h>
-#endif /* LACKS_FCNTL_H */
-#endif /* HAVE_MMAP */
-#ifndef LACKS_UNISTD_H
-#include <unistd.h> /* for sbrk, sysconf */
-#else /* LACKS_UNISTD_H */
-#if !defined(__FreeBSD__) && !defined(__OpenBSD__) && !defined(__NetBSD__)
-extern void* sbrk(ptrdiff_t);
-#endif /* FreeBSD etc */
-#endif /* LACKS_UNISTD_H */
-
-/* Declarations for locking */
-#if USE_LOCKS
-#ifndef WIN32
-#if defined (__SVR4) && defined (__sun) /* solaris */
-#include <thread.h>
-#elif !defined(LACKS_SCHED_H)
-#include <sched.h>
-#endif /* solaris or LACKS_SCHED_H */
-#if (defined(USE_RECURSIVE_LOCKS) && USE_RECURSIVE_LOCKS != 0) || !USE_SPIN_LOCKS
-#include <pthread.h>
-#endif /* USE_RECURSIVE_LOCKS ... */
-#elif defined(_MSC_VER)
-#ifndef _M_AMD64
-/* These are already defined on AMD64 builds */
-#ifdef __cplusplus
-extern "C" {
-#endif /* __cplusplus */
-LONG __cdecl _InterlockedCompareExchange(LONG volatile *Dest, LONG Exchange, LONG Comp);
-LONG __cdecl _InterlockedExchange(LONG volatile *Target, LONG Value);
-#ifdef __cplusplus
-}
-#endif /* __cplusplus */
-#endif /* _M_AMD64 */
-#pragma intrinsic (_InterlockedCompareExchange)
-#pragma intrinsic (_InterlockedExchange)
-#define interlockedcompareexchange _InterlockedCompareExchange
-#define interlockedexchange _InterlockedExchange
-#elif defined(WIN32) && defined(__GNUC__)
-#define interlockedcompareexchange(a, b, c) __sync_val_compare_and_swap(a, c, b)
-#define interlockedexchange __sync_lock_test_and_set
-#endif /* Win32 */
-#else /* USE_LOCKS */
-#endif /* USE_LOCKS */
-
-#ifndef LOCK_AT_FORK
-#define LOCK_AT_FORK 0
-#endif
-
-/* Declarations for bit scanning on win32 */
-#if defined(_MSC_VER) && _MSC_VER>=1300
-#ifndef BitScanForward /* Try to avoid pulling in WinNT.h */
-#ifdef __cplusplus
-extern "C" {
-#endif /* __cplusplus */
-unsigned char _BitScanForward(unsigned long *index, unsigned long mask);
-unsigned char _BitScanReverse(unsigned long *index, unsigned long mask);
-#ifdef __cplusplus
-}
-#endif /* __cplusplus */
-
-#define BitScanForward _BitScanForward
-#define BitScanReverse _BitScanReverse
-#pragma intrinsic(_BitScanForward)
-#pragma intrinsic(_BitScanReverse)
-#endif /* BitScanForward */
-#endif /* defined(_MSC_VER) && _MSC_VER>=1300 */
-
-#ifndef WIN32
-#ifndef malloc_getpagesize
-# ifdef _SC_PAGESIZE /* some SVR4 systems omit an underscore */
-# ifndef _SC_PAGE_SIZE
-# define _SC_PAGE_SIZE _SC_PAGESIZE
-# endif
-# endif
-# ifdef _SC_PAGE_SIZE
-# define malloc_getpagesize sysconf(_SC_PAGE_SIZE)
-# else
-# if defined(BSD) || defined(DGUX) || defined(HAVE_GETPAGESIZE)
- extern size_t getpagesize();
-# define malloc_getpagesize getpagesize()
-# else
-# ifdef WIN32 /* use supplied emulation of getpagesize */
-# define malloc_getpagesize getpagesize()
-# else
-# ifndef LACKS_SYS_PARAM_H
-# include <sys/param.h>
-# endif
-# ifdef EXEC_PAGESIZE
-# define malloc_getpagesize EXEC_PAGESIZE
-# else
-# ifdef NBPG
-# ifndef CLSIZE
-# define malloc_getpagesize NBPG
-# else
-# define malloc_getpagesize (NBPG * CLSIZE)
-# endif
-# else
-# ifdef NBPC
-# define malloc_getpagesize NBPC
-# else
-# ifdef PAGESIZE
-# define malloc_getpagesize PAGESIZE
-# else /* just guess */
-# define malloc_getpagesize ((size_t)4096U)
-# endif
-# endif
-# endif
-# endif
-# endif
-# endif
-# endif
-#endif
-#endif
-
-/* ------------------- size_t and alignment properties -------------------- */
-
-/* The byte and bit size of a size_t */
-#define SIZE_T_SIZE (sizeof(size_t))
-#define SIZE_T_BITSIZE (sizeof(size_t) << 3)
-
-/* Some constants coerced to size_t */
-/* Annoying but necessary to avoid errors on some platforms */
-#define SIZE_T_ZERO ((size_t)0)
-#define SIZE_T_ONE ((size_t)1)
-#define SIZE_T_TWO ((size_t)2)
-#define SIZE_T_FOUR ((size_t)4)
-#define TWO_SIZE_T_SIZES (SIZE_T_SIZE<<1)
-#define FOUR_SIZE_T_SIZES (SIZE_T_SIZE<<2)
-#define SIX_SIZE_T_SIZES (FOUR_SIZE_T_SIZES+TWO_SIZE_T_SIZES)
-#define HALF_MAX_SIZE_T (MAX_SIZE_T / 2U)
-
-/* The bit mask value corresponding to MALLOC_ALIGNMENT */
-#define CHUNK_ALIGN_MASK (MALLOC_ALIGNMENT - SIZE_T_ONE)
-
-/* True if address a has acceptable alignment */
-#define is_aligned(A) (((size_t)((A)) & (CHUNK_ALIGN_MASK)) == 0)
-
-/* the number of bytes to offset an address to align it */
-#define align_offset(A)\
- ((((size_t)(A) & CHUNK_ALIGN_MASK) == 0)? 0 :\
-  ((MALLOC_ALIGNMENT - ((size_t)(A) & CHUNK_ALIGN_MASK)) & CHUNK_ALIGN_MASK))
-
-/* -------------------------- MMAP preliminaries ------------------------- */
-
-/*
- If HAVE_MORECORE or HAVE_MMAP are false, we just define calls and
- checks to fail so the compiler optimizer can delete code rather than
- using so many "#if"s.
-*/
-
-
-/* MORECORE and MMAP must return MFAIL on failure */
-#define MFAIL ((void*)(MAX_SIZE_T))
-#define CMFAIL ((char*)(MFAIL)) /* defined for convenience */
-
-#if HAVE_MMAP
-
-#ifndef WIN32
-#define MUNMAP_DEFAULT(a, s) munmap((a), (s))
-#define MMAP_PROT (PROT_READ|PROT_WRITE)
-#if !defined(MAP_ANONYMOUS) && defined(MAP_ANON)
-#define MAP_ANONYMOUS MAP_ANON
-#endif /* MAP_ANON */
-#ifdef MAP_ANONYMOUS
-#define MMAP_FLAGS (MAP_PRIVATE|MAP_ANONYMOUS)
-#define MMAP_DEFAULT(s) mmap(0, (s), MMAP_PROT, MMAP_FLAGS, -1, 0)
-#else /* MAP_ANONYMOUS */
-/*
- Nearly all versions of mmap support MAP_ANONYMOUS, so the following
- is unlikely to be needed, but is supplied just in case.
-*/
-#define MMAP_FLAGS (MAP_PRIVATE)
-static int dev_zero_fd = -1; /* Cached file descriptor for /dev/zero. */
-#define MMAP_DEFAULT(s) ((dev_zero_fd < 0) ? \
- (dev_zero_fd = open("/dev/zero", O_RDWR), \
- mmap(0, (s), MMAP_PROT, MMAP_FLAGS, dev_zero_fd, 0)) : \
- mmap(0, (s), MMAP_PROT, MMAP_FLAGS, dev_zero_fd, 0))
-#endif /* MAP_ANONYMOUS */
-
-#define DIRECT_MMAP_DEFAULT(s) MMAP_DEFAULT(s)
-
-#else /* WIN32 */
-
-/* Win32 MMAP via VirtualAlloc */
-static FORCEINLINE void* win32mmap(size_t size) {
- void* ptr = VirtualAlloc(0, size, MEM_RESERVE|MEM_COMMIT, PAGE_READWRITE);
- return (ptr != 0)? ptr: MFAIL;
-}
-
-/* For direct MMAP, use MEM_TOP_DOWN to minimize interference */
-static FORCEINLINE void* win32direct_mmap(size_t size) {
- void* ptr = VirtualAlloc(0, size, MEM_RESERVE|MEM_COMMIT|MEM_TOP_DOWN,
-                          PAGE_READWRITE);
- return (ptr != 0)? ptr: MFAIL;
-}
-
-/* This function supports releasing coalesced segments */
-static FORCEINLINE int win32munmap(void* ptr, size_t size) {
- MEMORY_BASIC_INFORMATION minfo;
- char* cptr = (char*)ptr;
- while (size) {
-   if (VirtualQuery(cptr, &minfo, sizeof(minfo)) == 0)
-     return -1;
-   if (minfo.BaseAddress != cptr || minfo.AllocationBase != cptr ||
-       minfo.State != MEM_COMMIT || minfo.RegionSize > size)
-     return -1;
-   if (VirtualFree(cptr, 0, MEM_RELEASE) == 0)
-     return -1;
-   cptr += minfo.RegionSize;
-   size -= minfo.RegionSize;
- }
- return 0;
-}
-
-#define MMAP_DEFAULT(s) win32mmap(s)
-#define MUNMAP_DEFAULT(a, s) win32munmap((a), (s))
-#define DIRECT_MMAP_DEFAULT(s) win32direct_mmap(s)
-#endif /* WIN32 */
-#endif /* HAVE_MMAP */
-
-#if HAVE_MREMAP
-#ifndef WIN32
-#define MREMAP_DEFAULT(addr, osz, nsz, mv) mremap((addr), (osz), (nsz), (mv))
-#endif /* WIN32 */
-#endif /* HAVE_MREMAP */
-
-/**
- * Define CALL_MORECORE
- */
-#if HAVE_MORECORE
- #ifdef MORECORE
- #define CALL_MORECORE(S) MORECORE(S)
- #else /* MORECORE */
- #define CALL_MORECORE(S) MORECORE_DEFAULT(S)
- #endif /* MORECORE */
-#else /* HAVE_MORECORE */
- #define CALL_MORECORE(S) MFAIL
-#endif /* HAVE_MORECORE */
-
-/**
- * Define CALL_MMAP/CALL_MUNMAP/CALL_DIRECT_MMAP
- */
-#if HAVE_MMAP
- #define USE_MMAP_BIT (SIZE_T_ONE)
-
- #ifdef MMAP
- #define CALL_MMAP(s) MMAP(s)
- #else /* MMAP */
- #define CALL_MMAP(s) MMAP_DEFAULT(s)
- #endif /* MMAP */
- #ifdef MUNMAP
- #define CALL_MUNMAP(a, s) MUNMAP((a), (s))
- #else /* MUNMAP */
- #define CALL_MUNMAP(a, s) MUNMAP_DEFAULT((a), (s))
- #endif /* MUNMAP */
- #ifdef DIRECT_MMAP
- #define CALL_DIRECT_MMAP(s) DIRECT_MMAP(s)
- #else /* DIRECT_MMAP */
- #define CALL_DIRECT_MMAP(s) DIRECT_MMAP_DEFAULT(s)
- #endif /* DIRECT_MMAP */
-#else /* HAVE_MMAP */
- #define USE_MMAP_BIT (SIZE_T_ZERO)
-
- #define MMAP(s) MFAIL
- #define MUNMAP(a, s) (-1)
- #define DIRECT_MMAP(s) MFAIL
- #define CALL_DIRECT_MMAP(s) DIRECT_MMAP(s)
- #define CALL_MMAP(s) MMAP(s)
- #define CALL_MUNMAP(a, s) MUNMAP((a), (s))
-#endif /* HAVE_MMAP */
-
-/**
- * Define CALL_MREMAP
- */
-#if HAVE_MMAP && HAVE_MREMAP
- #ifdef MREMAP
- #define CALL_MREMAP(addr, osz, nsz, mv) MREMAP((addr), (osz), (nsz), (mv))
- #else /* MREMAP */
- #define CALL_MREMAP(addr, osz, nsz, mv) MREMAP_DEFAULT((addr), (osz), (nsz), (mv))
- #endif /* MREMAP */
-#else /* HAVE_MMAP && HAVE_MREMAP */
- #define CALL_MREMAP(addr, osz, nsz, mv) MFAIL
-#endif /* HAVE_MMAP && HAVE_MREMAP */
-
-/* mstate bit set if contiguous morecore disabled or failed */
-#define USE_NONCONTIGUOUS_BIT (4U)
-
-/* segment bit set in create_mspace_with_base */
-#define EXTERN_BIT (8U)
-
-
-/* --------------------------- Lock preliminaries ------------------------ */
-
-/*
- When locks are defined, there is one global lock, plus
- one per-mspace lock.
-
- The global lock ensures that mparams.magic and other unique
- mparams values are initialized only once. It also protects
- sequences of calls to MORECORE. In many cases sys_alloc requires
- two calls that should not be interleaved with calls by other
- threads. This does not protect against direct calls to MORECORE
- by other threads not using this lock, so there is still code to
- cope as best we can with interference.
-
- Per-mspace locks surround calls to malloc, free, etc.
- By default, locks are simple non-reentrant mutexes.
-
- Because lock-protected regions generally have bounded times, it is
- OK to use the supplied simple spinlocks. Spinlocks are likely to
Spinlocks are likely to - improve performance for lightly contended applications, but worsen - performance under heavy contention. - - If USE_LOCKS is > 1, the definitions of lock routines here are - bypassed, in which case you will need to define the type MLOCK_T, - and at least INITIAL_LOCK, DESTROY_LOCK, ACQUIRE_LOCK, RELEASE_LOCK - and TRY_LOCK. You must also declare a - static MLOCK_T malloc_global_mutex = { initialization values };. - -*/ - -#if !USE_LOCKS -#define USE_LOCK_BIT (0U) -#define INITIAL_LOCK(l) (0) -#define DESTROY_LOCK(l) (0) -#define ACQUIRE_MALLOC_GLOBAL_LOCK() -#define RELEASE_MALLOC_GLOBAL_LOCK() - -#else -#if USE_LOCKS > 1 -/* ----------------------- User-defined locks ------------------------ */ -/* Define your own lock implementation here */ -/* #define INITIAL_LOCK(lk) ... */ -/* #define DESTROY_LOCK(lk) ... */ -/* #define ACQUIRE_LOCK(lk) ... */ -/* #define RELEASE_LOCK(lk) ... */ -/* #define TRY_LOCK(lk) ... */ -/* static MLOCK_T malloc_global_mutex = ... */ - -#elif USE_SPIN_LOCKS - -/* First, define CAS_LOCK and CLEAR_LOCK on ints */ -/* Note CAS_LOCK defined to return 0 on success */ - -#if defined(__GNUC__)&& (__GNUC__ > 4 || (__GNUC__ == 4 && __GNUC_MINOR__ >= 1)) -#define CAS_LOCK(sl) __sync_lock_test_and_set(sl, 1) -#define CLEAR_LOCK(sl) __sync_lock_release(sl) - -#elif (defined(__GNUC__) && (defined(__i386__) || defined(__x86_64__))) -/* Custom spin locks for older gcc on x86 */ -static FORCEINLINE int x86_cas_lock(int *sl) { - int ret; - int val = 1; - int cmp = 0; - __asm__ __volatile__ ("lock; cmpxchgl %1, %2" - : "=a" (ret) - : "r" (val), "m" (*(sl)), "0"(cmp) - : "memory", "cc"); - return ret; -} - -static FORCEINLINE void x86_clear_lock(int* sl) { - assert(*sl != 0); - int prev = 0; - int ret; - __asm__ __volatile__ ("lock; xchgl %0, %1" - : "=r" (ret) - : "m" (*(sl)), "0"(prev) - : "memory"); -} - -#define CAS_LOCK(sl) x86_cas_lock(sl) -#define CLEAR_LOCK(sl) x86_clear_lock(sl) - -#else /* Win32 MSC */ -#define CAS_LOCK(sl) interlockedexchange(sl, (LONG)1) -#define CLEAR_LOCK(sl) interlockedexchange (sl, (LONG)0) - -#endif /* ... gcc spins locks ... */ - -/* How to yield for a spin lock */ -#define SPINS_PER_YIELD 63 -#if defined(_MSC_VER) -#define SLEEP_EX_DURATION 50 /* delay for yield/sleep */ -#define SPIN_LOCK_YIELD SleepEx(SLEEP_EX_DURATION, FALSE) -#elif defined (__SVR4) && defined (__sun) /* solaris */ -#define SPIN_LOCK_YIELD thr_yield(); -#elif !defined(LACKS_SCHED_H) -#define SPIN_LOCK_YIELD sched_yield(); -#else -#define SPIN_LOCK_YIELD -#endif /* ... yield ... */ - -#if !defined(USE_RECURSIVE_LOCKS) || USE_RECURSIVE_LOCKS == 0 -/* Plain spin locks use single word (embedded in malloc_states) */ -static int spin_acquire_lock(int *sl) { - int spins = 0; - while (*(volatile int *)sl != 0 || CAS_LOCK(sl)) { - if ((++spins & SPINS_PER_YIELD) == 0) { - SPIN_LOCK_YIELD; - } - } - return 0; -} - -#define MLOCK_T int -#define TRY_LOCK(sl) !CAS_LOCK(sl) -#define RELEASE_LOCK(sl) CLEAR_LOCK(sl) -#define ACQUIRE_LOCK(sl) (CAS_LOCK(sl)? spin_acquire_lock(sl) : 0) -#define INITIAL_LOCK(sl) (*sl = 0) -#define DESTROY_LOCK(sl) (0) -static MLOCK_T malloc_global_mutex = 0; - -#else /* USE_RECURSIVE_LOCKS */ -/* types for lock owners */ -#ifdef WIN32 -#define THREAD_ID_T DWORD -#define CURRENT_THREAD GetCurrentThreadId() -#define EQ_OWNER(X,Y) ((X) == (Y)) -#else -/* - Note: the following assume that pthread_t is a type that can be - initialized to (casted) zero. If this is not the case, you will need to - somehow redefine these or not use spin locks. 
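  As a standalone illustration (not part of the original file), the
  owner-tracking recursive lock implemented just below reduces to roughly
  the following sketch.  The names rlock_t, rlock_acquire and
  rlock_release are invented for this example, and GCC builtins stand in
  for the CAS_LOCK/CLEAR_LOCK primitives defined above; it also inherits
  the same narrow hand-off window as the original, so treat it as a
  sketch of the idea, not a hardened lock.

      #include <pthread.h>
      #include <sched.h>

      typedef struct {
        int sl;              // 0 = free, 1 = held
        unsigned int count;  // recursion depth of the owner
        pthread_t owner;     // meaningful only while sl != 0
      } rlock_t;

      static void rlock_acquire(rlock_t *lk) {
        pthread_t me = pthread_self();
        for (;;) {
          if (lk->sl == 0 && __sync_lock_test_and_set(&lk->sl, 1) == 0) {
            lk->owner = me;          // won the race: record ownership
            lk->count = 1;
            return;
          }
          if (lk->sl != 0 && pthread_equal(lk->owner, me)) {
            ++lk->count;             // re-entry by the owning thread
            return;
          }
          sched_yield();             // contended: spin politely
        }
      }

      static void rlock_release(rlock_t *lk) {
        if (--lk->count == 0)
          __sync_lock_release(&lk->sl);  // outermost exit frees the lock
      }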
-*/ -#define THREAD_ID_T pthread_t -#define CURRENT_THREAD pthread_self() -#define EQ_OWNER(X,Y) pthread_equal(X, Y) -#endif - -struct malloc_recursive_lock { - int sl; - unsigned int c; - THREAD_ID_T threadid; -}; - -#define MLOCK_T struct malloc_recursive_lock -static MLOCK_T malloc_global_mutex = { 0, 0, (THREAD_ID_T)0}; - -static FORCEINLINE void recursive_release_lock(MLOCK_T *lk) { - assert(lk->sl != 0); - if (--lk->c == 0) { - CLEAR_LOCK(&lk->sl); - } -} - -static FORCEINLINE int recursive_acquire_lock(MLOCK_T *lk) { - THREAD_ID_T mythreadid = CURRENT_THREAD; - int spins = 0; - for (;;) { - if (*((volatile int *)(&lk->sl)) == 0) { - if (!CAS_LOCK(&lk->sl)) { - lk->threadid = mythreadid; - lk->c = 1; - return 0; - } - } - else if (EQ_OWNER(lk->threadid, mythreadid)) { - ++lk->c; - return 0; - } - if ((++spins & SPINS_PER_YIELD) == 0) { - SPIN_LOCK_YIELD; - } - } -} - -static FORCEINLINE int recursive_try_lock(MLOCK_T *lk) { - THREAD_ID_T mythreadid = CURRENT_THREAD; - if (*((volatile int *)(&lk->sl)) == 0) { - if (!CAS_LOCK(&lk->sl)) { - lk->threadid = mythreadid; - lk->c = 1; - return 1; - } - } - else if (EQ_OWNER(lk->threadid, mythreadid)) { - ++lk->c; - return 1; - } - return 0; -} - -#define RELEASE_LOCK(lk) recursive_release_lock(lk) -#define TRY_LOCK(lk) recursive_try_lock(lk) -#define ACQUIRE_LOCK(lk) recursive_acquire_lock(lk) -#define INITIAL_LOCK(lk) ((lk)->threadid = (THREAD_ID_T)0, (lk)->sl = 0, (lk)->c = 0) -#define DESTROY_LOCK(lk) (0) -#endif /* USE_RECURSIVE_LOCKS */ - -#elif defined(WIN32) /* Win32 critical sections */ -#define MLOCK_T CRITICAL_SECTION -#define ACQUIRE_LOCK(lk) (EnterCriticalSection(lk), 0) -#define RELEASE_LOCK(lk) LeaveCriticalSection(lk) -#define TRY_LOCK(lk) TryEnterCriticalSection(lk) -#define INITIAL_LOCK(lk) (!InitializeCriticalSectionAndSpinCount((lk), 0x80000000|4000)) -#define DESTROY_LOCK(lk) (DeleteCriticalSection(lk), 0) -#define NEED_GLOBAL_LOCK_INIT - -static MLOCK_T malloc_global_mutex; -static volatile LONG malloc_global_mutex_status; - -/* Use spin loop to initialize global lock */ -static void init_malloc_global_mutex() { - for (;;) { - long stat = malloc_global_mutex_status; - if (stat > 0) - return; - /* transition to < 0 while initializing, then to > 0) */ - if (stat == 0 && - interlockedcompareexchange(&malloc_global_mutex_status, (LONG)-1, (LONG)0) == 0) { - InitializeCriticalSection(&malloc_global_mutex); - interlockedexchange(&malloc_global_mutex_status, (LONG)1); - return; - } - SleepEx(0, FALSE); - } -} - -#else /* pthreads-based locks */ -#define MLOCK_T pthread_mutex_t -#define ACQUIRE_LOCK(lk) pthread_mutex_lock(lk) -#define RELEASE_LOCK(lk) pthread_mutex_unlock(lk) -#define TRY_LOCK(lk) (!pthread_mutex_trylock(lk)) -#define INITIAL_LOCK(lk) pthread_init_lock(lk) -#define DESTROY_LOCK(lk) pthread_mutex_destroy(lk) - -#if defined(USE_RECURSIVE_LOCKS) && USE_RECURSIVE_LOCKS != 0 && defined(linux) && !defined(PTHREAD_MUTEX_RECURSIVE) -/* Cope with old-style linux recursive lock initialization by adding */ -/* skipped internal declaration from pthread.h */ -extern int pthread_mutexattr_setkind_np __P ((pthread_mutexattr_t *__attr, - int __kind)); -#define PTHREAD_MUTEX_RECURSIVE PTHREAD_MUTEX_RECURSIVE_NP -#define pthread_mutexattr_settype(x,y) pthread_mutexattr_setkind_np(x,y) -#endif /* USE_RECURSIVE_LOCKS ... 
*/ - -static MLOCK_T malloc_global_mutex = PTHREAD_MUTEX_INITIALIZER; - -static int pthread_init_lock (MLOCK_T *lk) { - pthread_mutexattr_t attr; - if (pthread_mutexattr_init(&attr)) return 1; -#if defined(USE_RECURSIVE_LOCKS) && USE_RECURSIVE_LOCKS != 0 - if (pthread_mutexattr_settype(&attr, PTHREAD_MUTEX_RECURSIVE)) return 1; -#endif - if (pthread_mutex_init(lk, &attr)) return 1; - if (pthread_mutexattr_destroy(&attr)) return 1; - return 0; -} - -#endif /* ... lock types ... */ - -/* Common code for all lock types */ -#define USE_LOCK_BIT (2U) - -#ifndef ACQUIRE_MALLOC_GLOBAL_LOCK -#define ACQUIRE_MALLOC_GLOBAL_LOCK() ACQUIRE_LOCK(&malloc_global_mutex); -#endif - -#ifndef RELEASE_MALLOC_GLOBAL_LOCK -#define RELEASE_MALLOC_GLOBAL_LOCK() RELEASE_LOCK(&malloc_global_mutex); -#endif - -#endif /* USE_LOCKS */ - -/* ----------------------- Chunk representations ------------------------ */ - -/* - (The following includes lightly edited explanations by Colin Plumb.) - - The malloc_chunk declaration below is misleading (but accurate and - necessary). It declares a "view" into memory allowing access to - necessary fields at known offsets from a given base. - - Chunks of memory are maintained using a `boundary tag' method as - originally described by Knuth. (See the paper by Paul Wilson - ftp://ftp.cs.utexas.edu/pub/garbage/allocsrv.ps for a survey of such - techniques.) Sizes of free chunks are stored both in the front of - each chunk and at the end. This makes consolidating fragmented - chunks into bigger chunks fast. The head fields also hold bits - representing whether chunks are free or in use. - - Here are some pictures to make it clearer. They are "exploded" to - show that the state of a chunk can be thought of as extending from - the high 31 bits of the head field of its header through the - prev_foot and PINUSE_BIT bit of the following chunk header. - - A chunk that's in use looks like: - - chunk-> +-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+ - | Size of previous chunk (if P = 0) | - +-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+ - +-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+ |P| - | Size of this chunk 1| +-+ - mem-> +-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+ - | | - +- -+ - | | - +- -+ - | : - +- size - sizeof(size_t) available payload bytes -+ - : | - chunk-> +- -+ - | | - +-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+ - +-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+ |1| - | Size of next chunk (may or may not be in use) | +-+ - mem-> +-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+ - - And if it's free, it looks like this: - - chunk-> +- -+ - | User payload (must be in use, or we would have merged!) 
| - +-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+ - +-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+ |P| - | Size of this chunk 0| +-+ - mem-> +-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+ - | Next pointer | - +-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+ - | Prev pointer | - +-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+ - | : - +- size - sizeof(struct chunk) unused bytes -+ - : | - chunk-> +-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+ - | Size of this chunk | - +-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+ - +-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+ |0| - | Size of next chunk (must be in use, or we would have merged)| +-+ - mem-> +-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+ - | : - +- User payload -+ - : | - +-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+ - |0| - +-+ - Note that since we always merge adjacent free chunks, the chunks - adjacent to a free chunk must be in use. - - Given a pointer to a chunk (which can be derived trivially from the - payload pointer) we can, in O(1) time, find out whether the adjacent - chunks are free, and if so, unlink them from the lists that they - are on and merge them with the current chunk. - - Chunks always begin on even word boundaries, so the mem portion - (which is returned to the user) is also on an even word boundary, and - thus at least double-word aligned. - - The P (PINUSE_BIT) bit, stored in the unused low-order bit of the - chunk size (which is always a multiple of two words), is an in-use - bit for the *previous* chunk. If that bit is *clear*, then the - word before the current chunk size contains the previous chunk - size, and can be used to find the front of the previous chunk. - The very first chunk allocated always has this bit set, preventing - access to non-existent (or non-owned) memory. If pinuse is set for - any given chunk, then you CANNOT determine the size of the - previous chunk, and might even get a memory addressing fault when - trying to do so. - - The C (CINUSE_BIT) bit, stored in the unused second-lowest bit of - the chunk size redundantly records whether the current chunk is - inuse (unless the chunk is mmapped). This redundancy enables usage - checks within free and realloc, and reduces indirection when freeing - and consolidating chunks. - - Each freshly allocated chunk must have both cinuse and pinuse set. - That is, each allocated chunk borders either a previously allocated - and still in-use chunk, or the base of its memory arena. This is - ensured by making all allocations from the `lowest' part of any - found chunk. Further, no free chunk physically borders another one, - so each free chunk is known to be preceded and followed by either - inuse chunks or the ends of memory. - - Note that the `foot' of the current chunk is actually represented - as the prev_foot of the NEXT chunk. This makes it easier to - deal with alignments etc but can be very confusing when trying - to extend or adapt this code. - - The exceptions to all this are - - 1. The special chunk `top' is the top-most available chunk (i.e., - the one bordering the end of available memory). It is treated - specially. Top is never included in any bin, is used only if - no other chunk is available, and is released back to the - system if it is very large (see M_TRIM_THRESHOLD). 
In effect,
-        the top chunk is treated as larger (and thus less well
-        fitting) than any other available chunk.  The top chunk
-        doesn't update its trailing size field since there is no next
-        contiguous chunk that would have to index off it.  However,
-        space is still allocated for it (TOP_FOOT_SIZE) to enable
-        separation or merging when space is extended.
-
-     2. Chunks allocated via mmap have both cinuse and pinuse bits
-        cleared in their head fields.  Because they are allocated
-        one-by-one, each must carry its own prev_foot field, which is
-        also used to hold the offset this chunk has within its mmapped
-        region, which is needed to preserve alignment. Each mmapped
-        chunk is trailed by the first two fields of a fake next-chunk
-        for the sake of usage checks.
-
-*/
-
-struct malloc_chunk {
-  size_t               prev_foot;  /* Size of previous chunk (if free).  */
-  size_t               head;       /* Size and inuse bits. */
-  struct malloc_chunk* fd;         /* double links -- used only if free. */
-  struct malloc_chunk* bk;
-};
-
-typedef struct malloc_chunk  mchunk;
-typedef struct malloc_chunk* mchunkptr;
-typedef struct malloc_chunk* sbinptr;  /* The type of bins of chunks */
-typedef unsigned int bindex_t;         /* Described below */
-typedef unsigned int binmap_t;         /* Described below */
-typedef unsigned int flag_t;           /* The type of various bit flag sets */
-
-/* ------------------- Chunk sizes and alignments ------------------------ */
-
-#define MCHUNK_SIZE         (sizeof(mchunk))
-
-#if FOOTERS
-#define CHUNK_OVERHEAD      (TWO_SIZE_T_SIZES)
-#else /* FOOTERS */
-#define CHUNK_OVERHEAD      (SIZE_T_SIZE)
-#endif /* FOOTERS */
-
-/* MMapped chunks need a second word of overhead ... */
-#define MMAP_CHUNK_OVERHEAD (TWO_SIZE_T_SIZES)
-/* ... and additional padding for fake next-chunk at foot */
-#define MMAP_FOOT_PAD       (FOUR_SIZE_T_SIZES)
-
-/* The smallest size we can malloc is an aligned minimal chunk */
-#define MIN_CHUNK_SIZE\
-  ((MCHUNK_SIZE + CHUNK_ALIGN_MASK) & ~CHUNK_ALIGN_MASK)
-
-/* conversion from malloc headers to user pointers, and back */
-#define chunk2mem(p)        ((void*)((char*)(p)       + TWO_SIZE_T_SIZES))
-#define mem2chunk(mem)      ((mchunkptr)((char*)(mem) - TWO_SIZE_T_SIZES))
-/* chunk associated with aligned address A */
-#define align_as_chunk(A)   (mchunkptr)((A) + align_offset(chunk2mem(A)))
-
-/* Bounds on request (not chunk) sizes. */
-#define MAX_REQUEST         ((-MIN_CHUNK_SIZE) << 2)
-#define MIN_REQUEST         (MIN_CHUNK_SIZE - CHUNK_OVERHEAD - SIZE_T_ONE)
-
-/* pad request bytes into a usable size */
-#define pad_request(req) \
-   (((req) + CHUNK_OVERHEAD + CHUNK_ALIGN_MASK) & ~CHUNK_ALIGN_MASK)
-
-/* pad request, checking for minimum (but not maximum) */
-#define request2size(req) \
-  (((req) < MIN_REQUEST)? MIN_CHUNK_SIZE : pad_request(req))
-
-
-/* ------------------ Operations on head and foot fields ----------------- */
-
-/*
-  The head field of a chunk is or'ed with PINUSE_BIT when the previous
-  adjacent chunk is in use, and or'ed with CINUSE_BIT if this chunk is in
-  use, unless mmapped, in which case both bits are cleared.
-
-  FLAG4_BIT is not used by this malloc, but might be useful in extensions.
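  A tiny self-contained sketch of this encoding, using PB and CB as
  stand-ins for the PINUSE_BIT and CINUSE_BIT macros defined just below
  (the ~7 mask plays the role of ~FLAG_BITS):

      #include <assert.h>
      #include <stddef.h>

      #define PB ((size_t)1)               // previous chunk in use
      #define CB ((size_t)2)               // this chunk in use

      int main(void) {
        size_t head = (size_t)64 | PB | CB;  // 64-byte inuse chunk, prev inuse
        assert((head & ~(size_t)7) == 64);   // chunksize(): strip flag bits
        assert(head & PB);                   // pinuse()
        assert(head & CB);                   // cinuse()
        head &= ~PB;                         // clear_pinuse()
        assert(!(head & PB));
        return 0;
      }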
-*/ - -#define PINUSE_BIT (SIZE_T_ONE) -#define CINUSE_BIT (SIZE_T_TWO) -#define FLAG4_BIT (SIZE_T_FOUR) -#define INUSE_BITS (PINUSE_BIT|CINUSE_BIT) -#define FLAG_BITS (PINUSE_BIT|CINUSE_BIT|FLAG4_BIT) - -/* Head value for fenceposts */ -#define FENCEPOST_HEAD (INUSE_BITS|SIZE_T_SIZE) - -/* extraction of fields from head words */ -#define cinuse(p) ((p)->head & CINUSE_BIT) -#define pinuse(p) ((p)->head & PINUSE_BIT) -#define flag4inuse(p) ((p)->head & FLAG4_BIT) -#define is_inuse(p) (((p)->head & INUSE_BITS) != PINUSE_BIT) -#define is_mmapped(p) (((p)->head & INUSE_BITS) == 0) - -#define chunksize(p) ((p)->head & ~(FLAG_BITS)) - -#define clear_pinuse(p) ((p)->head &= ~PINUSE_BIT) -#define set_flag4(p) ((p)->head |= FLAG4_BIT) -#define clear_flag4(p) ((p)->head &= ~FLAG4_BIT) - -/* Treat space at ptr +/- offset as a chunk */ -#define chunk_plus_offset(p, s) ((mchunkptr)(((char*)(p)) + (s))) -#define chunk_minus_offset(p, s) ((mchunkptr)(((char*)(p)) - (s))) - -/* Ptr to next or previous physical malloc_chunk. */ -#define next_chunk(p) ((mchunkptr)( ((char*)(p)) + ((p)->head & ~FLAG_BITS))) -#define prev_chunk(p) ((mchunkptr)( ((char*)(p)) - ((p)->prev_foot) )) - -/* extract next chunk's pinuse bit */ -#define next_pinuse(p) ((next_chunk(p)->head) & PINUSE_BIT) - -/* Get/set size at footer */ -#define get_foot(p, s) (((mchunkptr)((char*)(p) + (s)))->prev_foot) -#define set_foot(p, s) (((mchunkptr)((char*)(p) + (s)))->prev_foot = (s)) - -/* Set size, pinuse bit, and foot */ -#define set_size_and_pinuse_of_free_chunk(p, s)\ - ((p)->head = (s|PINUSE_BIT), set_foot(p, s)) - -/* Set size, pinuse bit, foot, and clear next pinuse */ -#define set_free_with_pinuse(p, s, n)\ - (clear_pinuse(n), set_size_and_pinuse_of_free_chunk(p, s)) - -/* Get the internal overhead associated with chunk p */ -#define overhead_for(p)\ - (is_mmapped(p)? MMAP_CHUNK_OVERHEAD : CHUNK_OVERHEAD) - -/* Return true if malloced space is not necessarily cleared */ -#if MMAP_CLEARS -#define calloc_must_clear(p) (!is_mmapped(p)) -#else /* MMAP_CLEARS */ -#define calloc_must_clear(p) (1) -#endif /* MMAP_CLEARS */ - -/* ---------------------- Overlaid data structures ----------------------- */ - -/* - When chunks are not in use, they are treated as nodes of either - lists or trees. - - "Small" chunks are stored in circular doubly-linked lists, and look - like this: - - chunk-> +-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+ - | Size of previous chunk | - +-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+ - `head:' | Size of chunk, in bytes |P| - mem-> +-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+ - | Forward pointer to next chunk in list | - +-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+ - | Back pointer to previous chunk in list | - +-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+ - | Unused space (may be 0 bytes long) . - . . - . | -nextchunk-> +-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+ - `foot:' | Size of chunk, in bytes | - +-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+ - - Larger chunks are kept in a form of bitwise digital trees (aka - tries) keyed on chunksizes. Because malloc_tree_chunks are only for - free chunks greater than 256 bytes, their size doesn't impose any - constraints on user chunk sizes. 
Each node looks like:
-
-   chunk-> +-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+
-           |             Size of previous chunk                            |
-           +-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+
-   `head:' |             Size of chunk, in bytes                         |P|
-     mem-> +-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+
-           |             Forward pointer to next chunk of same size        |
-           +-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+
-           |             Back pointer to previous chunk of same size       |
-           +-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+
-           |             Pointer to left child (child[0])                  |
-           +-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+
-           |             Pointer to right child (child[1])                 |
-           +-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+
-           |             Pointer to parent                                 |
-           +-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+
-           |             bin index of this chunk                           |
-           +-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+
-           |             Unused space                                      .
-           .                                                               |
-nextchunk-> +-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+
-   `foot:' |             Size of chunk, in bytes                           |
-           +-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+
-
-  Each tree holding treenodes is a tree of unique chunk sizes.  Chunks
-  of the same size are arranged in a circularly-linked list, with only
-  the oldest chunk (the next to be used, in our FIFO ordering)
-  actually in the tree.  (Tree members are distinguished by a non-null
-  parent pointer.)  If a chunk with the same size as an existing node
-  is inserted, it is linked off the existing node using pointers that
-  work in the same way as fd/bk pointers of small chunks.
-
-  Each tree contains a power of 2 sized range of chunk sizes (the
-  smallest is 0x100 <= x < 0x180), which is divided in half at each
-  tree level, with the chunks in the smaller half of the range (0x100
-  <= x < 0x140 for the top node) in the left subtree and the larger
-  half (0x140 <= x < 0x180) in the right subtree.  This is, of course,
-  done by inspecting individual bits.
-
-  Using these rules, each node's left subtree contains all smaller
-  sizes than its right subtree.  However, the node at the root of each
-  subtree has no particular ordering relationship to either.  (The
-  dividing line between the subtree sizes is based on trie relation.)
-  If we remove the last chunk of a given size from the interior of the
-  tree, we need to replace it with a leaf node.  The tree ordering
-  rules permit a node to be replaced by any leaf below it.
-
-  The smallest chunk in a tree (a common operation in a best-fit
-  allocator) can be found by walking a path to the leftmost leaf in
-  the tree.  Unlike a usual binary tree, where we follow left child
-  pointers until we reach a null, here we follow the right child
-  pointer any time the left one is null, until we reach a leaf with
-  both child pointers null. The smallest chunk in the tree will be
-  somewhere along that path.
-
-  The worst case number of steps to add, find, or remove a node is
-  bounded by the number of bits differentiating chunks within
-  bins. Under current bin calculations, this ranges from 6 up to 21
-  (for 32 bit sizes) or up to 53 (for 64 bit sizes). The typical case
-  is of course much better.
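  For concreteness, here is the same bin-index rule as a plain function,
  assuming TREEBIN_SHIFT == 8 and NTREEBINS == 32 as defined later in
  this file; tree_index_for is an invented name, and the real code uses
  the compute_tree_index macro defined below:

      #include <assert.h>
      #include <stddef.h>

      // K is the position of the leading bit of S >> 8; the next bit of
      // S selects one of the two bins belonging to that power of two.
      static unsigned tree_index_for(size_t S) {
        size_t X = S >> 8;
        unsigned K = 0;
        if (X == 0) return 0;
        if (X > 0xFFFF) return 31;          // largest bin catches the rest
        while ((X >> (K + 1)) != 0) ++K;    // K = floor(log2(X))
        return (K << 1) + (unsigned)((S >> (K + 7)) & 1);
      }

      int main(void) {
        assert(tree_index_for(0x100) == 0); // smallest tree-managed size
        assert(tree_index_for(0x180) == 1); // upper bin of the same power
        assert(tree_index_for(0x200) == 2);
        assert(tree_index_for(0x300) == 3);
        return 0;
      }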
-*/ - -struct malloc_tree_chunk { - /* The first four fields must be compatible with malloc_chunk */ - size_t prev_foot; - size_t head; - struct malloc_tree_chunk* fd; - struct malloc_tree_chunk* bk; - - struct malloc_tree_chunk* child[2]; - struct malloc_tree_chunk* parent; - bindex_t index; -}; - -typedef struct malloc_tree_chunk tchunk; -typedef struct malloc_tree_chunk* tchunkptr; -typedef struct malloc_tree_chunk* tbinptr; /* The type of bins of trees */ - -/* A little helper macro for trees */ -#define leftmost_child(t) ((t)->child[0] != 0? (t)->child[0] : (t)->child[1]) - -/* ----------------------------- Segments -------------------------------- */ - -/* - Each malloc space may include non-contiguous segments, held in a - list headed by an embedded malloc_segment record representing the - top-most space. Segments also include flags holding properties of - the space. Large chunks that are directly allocated by mmap are not - included in this list. They are instead independently created and - destroyed without otherwise keeping track of them. - - Segment management mainly comes into play for spaces allocated by - MMAP. Any call to MMAP might or might not return memory that is - adjacent to an existing segment. MORECORE normally contiguously - extends the current space, so this space is almost always adjacent, - which is simpler and faster to deal with. (This is why MORECORE is - used preferentially to MMAP when both are available -- see - sys_alloc.) When allocating using MMAP, we don't use any of the - hinting mechanisms (inconsistently) supported in various - implementations of unix mmap, or distinguish reserving from - committing memory. Instead, we just ask for space, and exploit - contiguity when we get it. It is probably possible to do - better than this on some systems, but no general scheme seems - to be significantly better. - - Management entails a simpler variant of the consolidation scheme - used for chunks to reduce fragmentation -- new adjacent memory is - normally prepended or appended to an existing segment. However, - there are limitations compared to chunk consolidation that mostly - reflect the fact that segment processing is relatively infrequent - (occurring only when getting memory from system) and that we - don't expect to have huge numbers of segments: - - * Segments are not indexed, so traversal requires linear scans. (It - would be possible to index these, but is not worth the extra - overhead and complexity for most programs on most platforms.) - * New segments are only appended to old ones when holding top-most - memory; if they cannot be prepended to others, they are held in - different segments. - - Except for the top-most segment of an mstate, each segment record - is kept at the tail of its segment. Segments are added by pushing - segment records onto the list headed by &mstate.seg for the - containing mstate. - - Segment flags control allocation/merge/deallocation policies: - * If EXTERN_BIT set, then we did not allocate this segment, - and so should not try to deallocate or merge with others. - (This currently holds only for the initial segment passed - into create_mspace_with_base.) - * If USE_MMAP_BIT set, the segment may be merged with - other surrounding mmapped segments and trimmed/de-allocated - using munmap. - * If neither bit is set, then the segment was obtained using - MORECORE so can be merged with surrounding MORECORE'd segments - and deallocated/trimmed using MORECORE with negative arguments. 
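  The linear scans this implies are short; a sketch with a local struct
  mirroring malloc_segment (holding is an invented name; segment_holding
  later in this file is the real version):

      #include <stddef.h>

      struct seg { char *base; size_t size; struct seg *next; };

      // Walk the list and return the segment containing addr, if any.
      static struct seg *holding(struct seg *s, char *addr) {
        for (; s != NULL; s = s->next)
          if (addr >= s->base && addr < s->base + s->size)
            return s;
        return NULL;
      }

      int main(void) {
        static char block[64];
        struct seg s1 = { block, sizeof block, NULL };
        return holding(&s1, block + 10) == &s1 ? 0 : 1;
      }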
-*/
-
-struct malloc_segment {
-  char*        base;             /* base address */
-  size_t       size;             /* allocated size */
-  struct malloc_segment* next;   /* ptr to next segment */
-  flag_t       sflags;           /* mmap and extern flag */
-};
-
-#define is_mmapped_segment(S)  ((S)->sflags & USE_MMAP_BIT)
-#define is_extern_segment(S)   ((S)->sflags & EXTERN_BIT)
-
-typedef struct malloc_segment  msegment;
-typedef struct malloc_segment* msegmentptr;
-
-/* ---------------------------- malloc_state ----------------------------- */
-
-/*
-   A malloc_state holds all of the bookkeeping for a space.
-   The main fields are:
-
-  Top
-    The topmost chunk of the currently active segment. Its size is
-    cached in topsize.  The actual size of topmost space is
-    topsize+TOP_FOOT_SIZE, which includes space reserved for adding
-    fenceposts and segment records if necessary when getting more
-    space from the system.  The size at which to autotrim top is
-    cached from mparams in trim_check, except that it is disabled if
-    an autotrim fails.
-
-  Designated victim (dv)
-    This is the preferred chunk for servicing small requests that
-    don't have exact fits.  It is normally the chunk split off most
-    recently to service another small request.  Its size is cached in
-    dvsize. The link fields of this chunk are not maintained since it
-    is not kept in a bin.
-
-  SmallBins
-    An array of bin headers for free chunks.  These bins hold chunks
-    with sizes less than MIN_LARGE_SIZE bytes. Each bin contains
-    chunks of all the same size, spaced 8 bytes apart.  To simplify
-    use in double-linked lists, each bin header acts as a malloc_chunk
-    pointing to the real first node, if it exists (else pointing to
-    itself).  This avoids special-casing for headers.  But to avoid
-    waste, we allocate only the fd/bk pointers of bins, and then use
-    repositioning tricks to treat these as the fields of a chunk.
-
-  TreeBins
-    Treebins are pointers to the roots of trees holding a range of
-    sizes. There are 2 equally spaced treebins for each power of two
-    from TREEBIN_SHIFT to TREEBIN_SHIFT+16. The last bin holds anything
-    larger.
-
-  Bin maps
-    There is one bit map for small bins ("smallmap") and one for
-    treebins ("treemap").  Each bin sets its bit when non-empty, and
-    clears the bit when empty.  Bit operations are then used to avoid
-    bin-by-bin searching -- nearly all "search" is done without ever
-    looking at bins that won't be selected.  The bit maps
-    conservatively use 32 bits per map word, even on a 64-bit system.
-    For a good description of some of the bit-based techniques used
-    here, see Henry S. Warren Jr's book "Hacker's Delight" (and
-    supplement at http://hackersdelight.org/). Many of these are
-    intended to reduce the branchiness of paths through malloc etc, as
-    well as to reduce the number of memory locations read or written.
-
-  Segments
-    A list of segments headed by an embedded malloc_segment record
-    representing the initial space.
-
-  Address check support
-    The least_addr field is the least address ever obtained from
-    MORECORE or MMAP. Attempted frees and reallocs of any address less
-    than this are trapped (unless INSECURE is defined).
-
-  Magic tag
-    A cross-check field that should always hold same value as mparams.magic.
-
-  Max allowed footprint
-    The maximum allowed bytes to allocate from system (zero means no limit)
-
-  Flags
-    Bits recording whether to use MMAP, locks, or contiguous MORECORE
-
-  Statistics
-    Each space keeps track of current and maximum system memory
-    obtained via MORECORE or MMAP.
- - Trim support - Fields holding the amount of unused topmost memory that should trigger - trimming, and a counter to force periodic scanning to release unused - non-topmost segments. - - Locking - If USE_LOCKS is defined, the "mutex" lock is acquired and released - around every public call using this mspace. - - Extension support - A void* pointer and a size_t field that can be used to help implement - extensions to this malloc. -*/ - -/* Bin types, widths and sizes */ -#define NSMALLBINS (32U) -#define NTREEBINS (32U) -#define SMALLBIN_SHIFT (3U) -#define SMALLBIN_WIDTH (SIZE_T_ONE << SMALLBIN_SHIFT) -#define TREEBIN_SHIFT (8U) -#define MIN_LARGE_SIZE (SIZE_T_ONE << TREEBIN_SHIFT) -#define MAX_SMALL_SIZE (MIN_LARGE_SIZE - SIZE_T_ONE) -#define MAX_SMALL_REQUEST (MAX_SMALL_SIZE - CHUNK_ALIGN_MASK - CHUNK_OVERHEAD) - -struct malloc_state { - binmap_t smallmap; - binmap_t treemap; - size_t dvsize; - size_t topsize; - char* least_addr; - mchunkptr dv; - mchunkptr top; - size_t trim_check; - size_t release_checks; - size_t magic; - mchunkptr smallbins[(NSMALLBINS+1)*2]; - tbinptr treebins[NTREEBINS]; - size_t footprint; - size_t max_footprint; - size_t footprint_limit; /* zero means no limit */ - flag_t mflags; -#if USE_LOCKS - MLOCK_T mutex; /* locate lock among fields that rarely change */ -#endif /* USE_LOCKS */ - msegment seg; - void* extp; /* Unused but available for extensions */ - size_t exts; -}; - -typedef struct malloc_state* mstate; - -/* ------------- Global malloc_state and malloc_params ------------------- */ - -/* - malloc_params holds global properties, including those that can be - dynamically set using mallopt. There is a single instance, mparams, - initialized in init_mparams. Note that the non-zeroness of "magic" - also serves as an initialization flag. 
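  A miniature of that check-then-initialize pattern, with invented names
  and a pthread mutex standing in for the global malloc lock (the real
  init_mparams below also validates the configuration and derives magic
  from /dev/urandom or the clock):

      #include <pthread.h>
      #include <stddef.h>
      #include <time.h>

      static struct { size_t magic; size_t page_size; } params;
      static pthread_mutex_t boot_lock = PTHREAD_MUTEX_INITIALIZER;

      static void ensure_params(void) {
        if (params.magic != 0) return;       // fast path: already set up
        pthread_mutex_lock(&boot_lock);
        if (params.magic == 0) {             // re-check under the lock
          params.page_size = 4096;           // placeholder configuration
          params.magic = (size_t)time(NULL) | (size_t)8;  // nonzero by construction
        }
        pthread_mutex_unlock(&boot_lock);
      }

      int main(void) { ensure_params(); return params.magic == 0; }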
-*/ - -struct malloc_params { - size_t magic; - size_t page_size; - size_t granularity; - size_t mmap_threshold; - size_t trim_threshold; - flag_t default_mflags; -}; - -static struct malloc_params mparams; - -/* Ensure mparams initialized */ -#define ensure_initialization() (void)(mparams.magic != 0 || init_mparams()) - -#if !ONLY_MSPACES - -/* The global malloc_state used for all non-"mspace" calls */ -static struct malloc_state _gm_; -#define gm (&_gm_) -#define is_global(M) ((M) == &_gm_) - -#endif /* !ONLY_MSPACES */ - -#define is_initialized(M) ((M)->top != 0) - -/* -------------------------- system alloc setup ------------------------- */ - -/* Operations on mflags */ - -#define use_lock(M) ((M)->mflags & USE_LOCK_BIT) -#define enable_lock(M) ((M)->mflags |= USE_LOCK_BIT) -#if USE_LOCKS -#define disable_lock(M) ((M)->mflags &= ~USE_LOCK_BIT) -#else -#define disable_lock(M) -#endif - -#define use_mmap(M) ((M)->mflags & USE_MMAP_BIT) -#define enable_mmap(M) ((M)->mflags |= USE_MMAP_BIT) -#if HAVE_MMAP -#define disable_mmap(M) ((M)->mflags &= ~USE_MMAP_BIT) -#else -#define disable_mmap(M) -#endif - -#define use_noncontiguous(M) ((M)->mflags & USE_NONCONTIGUOUS_BIT) -#define disable_contiguous(M) ((M)->mflags |= USE_NONCONTIGUOUS_BIT) - -#define set_lock(M,L)\ - ((M)->mflags = (L)?\ - ((M)->mflags | USE_LOCK_BIT) :\ - ((M)->mflags & ~USE_LOCK_BIT)) - -/* page-align a size */ -#define page_align(S)\ - (((S) + (mparams.page_size - SIZE_T_ONE)) & ~(mparams.page_size - SIZE_T_ONE)) - -/* granularity-align a size */ -#define granularity_align(S)\ - (((S) + (mparams.granularity - SIZE_T_ONE))\ - & ~(mparams.granularity - SIZE_T_ONE)) - - -/* For mmap, use granularity alignment on windows, else page-align */ -#ifdef WIN32 -#define mmap_align(S) granularity_align(S) -#else -#define mmap_align(S) page_align(S) -#endif - -/* For sys_alloc, enough padding to ensure can malloc request on success */ -#define SYS_ALLOC_PADDING (TOP_FOOT_SIZE + MALLOC_ALIGNMENT) - -#define is_page_aligned(S)\ - (((size_t)(S) & (mparams.page_size - SIZE_T_ONE)) == 0) -#define is_granularity_aligned(S)\ - (((size_t)(S) & (mparams.granularity - SIZE_T_ONE)) == 0) - -/* True if segment S holds address A */ -#define segment_holds(S, A)\ - ((char*)(A) >= S->base && (char*)(A) < S->base + S->size) - -/* Return segment holding given address */ -static msegmentptr segment_holding(mstate m, char* addr) { - msegmentptr sp = &m->seg; - for (;;) { - if (addr >= sp->base && addr < sp->base + sp->size) - return sp; - if ((sp = sp->next) == 0) - return 0; - } - return 0; -} - -/* Return true if segment contains a segment link */ -static int has_segment_link(mstate m, msegmentptr ss) { - msegmentptr sp = &m->seg; - for (;;) { - if ((char*)sp >= ss->base && (char*)sp < ss->base + ss->size) - return 1; - if ((sp = sp->next) == 0) - return 0; - } - return 0; -} - -#ifndef MORECORE_CANNOT_TRIM -#define should_trim(M,s) ((s) > (M)->trim_check) -#else /* MORECORE_CANNOT_TRIM */ -#define should_trim(M,s) (0) -#endif /* MORECORE_CANNOT_TRIM */ - -/* - TOP_FOOT_SIZE is padding at the end of a segment, including space - that may be needed to place segment records and fenceposts when new - noncontiguous segments are added. -*/ -#define TOP_FOOT_SIZE\ - (align_offset(chunk2mem(0))+pad_request(sizeof(struct malloc_segment))+MIN_CHUNK_SIZE) - - -/* ------------------------------- Hooks -------------------------------- */ - -/* - PREACTION should be defined to return 0 on success, and nonzero on - failure. 
If you are not using locking, you can redefine these to do - anything you like. -*/ - -#if USE_LOCKS -#define PREACTION(M) ((use_lock(M))? ACQUIRE_LOCK(&(M)->mutex) : 0) -#define POSTACTION(M) { if (use_lock(M)) RELEASE_LOCK(&(M)->mutex); } -#else /* USE_LOCKS */ - -#ifndef PREACTION -#define PREACTION(M) (0) -#endif /* PREACTION */ - -#ifndef POSTACTION -#define POSTACTION(M) -#endif /* POSTACTION */ - -#endif /* USE_LOCKS */ - -/* - CORRUPTION_ERROR_ACTION is triggered upon detected bad addresses. - USAGE_ERROR_ACTION is triggered on detected bad frees and - reallocs. The argument p is an address that might have triggered the - fault. It is ignored by the two predefined actions, but might be - useful in custom actions that try to help diagnose errors. -*/ - -#if PROCEED_ON_ERROR - -/* A count of the number of corruption errors causing resets */ -int malloc_corruption_error_count; - -/* default corruption action */ -static void reset_on_error(mstate m); - -#define CORRUPTION_ERROR_ACTION(m) reset_on_error(m) -#define USAGE_ERROR_ACTION(m, p) - -#else /* PROCEED_ON_ERROR */ - -#ifndef CORRUPTION_ERROR_ACTION -#define CORRUPTION_ERROR_ACTION(m) ABORT -#endif /* CORRUPTION_ERROR_ACTION */ - -#ifndef USAGE_ERROR_ACTION -#define USAGE_ERROR_ACTION(m,p) ABORT -#endif /* USAGE_ERROR_ACTION */ - -#endif /* PROCEED_ON_ERROR */ - - -/* -------------------------- Debugging setup ---------------------------- */ - -#if ! DEBUG - -#define check_free_chunk(M,P) -#define check_inuse_chunk(M,P) -#define check_malloced_chunk(M,P,N) -#define check_mmapped_chunk(M,P) -#define check_malloc_state(M) -#define check_top_chunk(M,P) - -#else /* DEBUG */ -#define check_free_chunk(M,P) do_check_free_chunk(M,P) -#define check_inuse_chunk(M,P) do_check_inuse_chunk(M,P) -#define check_top_chunk(M,P) do_check_top_chunk(M,P) -#define check_malloced_chunk(M,P,N) do_check_malloced_chunk(M,P,N) -#define check_mmapped_chunk(M,P) do_check_mmapped_chunk(M,P) -#define check_malloc_state(M) do_check_malloc_state(M) - -static void do_check_any_chunk(mstate m, mchunkptr p); -static void do_check_top_chunk(mstate m, mchunkptr p); -static void do_check_mmapped_chunk(mstate m, mchunkptr p); -static void do_check_inuse_chunk(mstate m, mchunkptr p); -static void do_check_free_chunk(mstate m, mchunkptr p); -static void do_check_malloced_chunk(mstate m, void* mem, size_t s); -static void do_check_tree(mstate m, tchunkptr t); -static void do_check_treebin(mstate m, bindex_t i); -static void do_check_smallbin(mstate m, bindex_t i); -static void do_check_malloc_state(mstate m); -static int bin_find(mstate m, mchunkptr x); -static size_t traverse_and_check(mstate m); -#endif /* DEBUG */ - -/* ---------------------------- Indexing Bins ---------------------------- */ - -#define is_small(s) (((s) >> SMALLBIN_SHIFT) < NSMALLBINS) -#define small_index(s) (bindex_t)((s) >> SMALLBIN_SHIFT) -#define small_index2size(i) ((i) << SMALLBIN_SHIFT) -#define MIN_SMALL_INDEX (small_index(MIN_CHUNK_SIZE)) - -/* addressing by index. See above about smallbin repositioning */ -#define smallbin_at(M, i) ((sbinptr)((char*)&((M)->smallbins[(i)<<1]))) -#define treebin_at(M,i) (&((M)->treebins[i])) - -/* assign tree index for size S to variable I. 
Use x86 asm if possible */ -#if defined(__GNUC__) && (defined(__i386__) || defined(__x86_64__)) -#define compute_tree_index(S, I)\ -{\ - unsigned int X = S >> TREEBIN_SHIFT;\ - if (X == 0)\ - I = 0;\ - else if (X > 0xFFFF)\ - I = NTREEBINS-1;\ - else {\ - unsigned int K = (unsigned) sizeof(X)*__CHAR_BIT__ - 1 - (unsigned) __builtin_clz(X); \ - I = (bindex_t)((K << 1) + ((S >> (K + (TREEBIN_SHIFT-1)) & 1)));\ - }\ -} - -#elif defined (__INTEL_COMPILER) -#define compute_tree_index(S, I)\ -{\ - size_t X = S >> TREEBIN_SHIFT;\ - if (X == 0)\ - I = 0;\ - else if (X > 0xFFFF)\ - I = NTREEBINS-1;\ - else {\ - unsigned int K = _bit_scan_reverse (X); \ - I = (bindex_t)((K << 1) + ((S >> (K + (TREEBIN_SHIFT-1)) & 1)));\ - }\ -} - -#elif defined(_MSC_VER) && _MSC_VER>=1300 -#define compute_tree_index(S, I)\ -{\ - size_t X = S >> TREEBIN_SHIFT;\ - if (X == 0)\ - I = 0;\ - else if (X > 0xFFFF)\ - I = NTREEBINS-1;\ - else {\ - unsigned int K;\ - _BitScanReverse((DWORD *) &K, (DWORD) X);\ - I = (bindex_t)((K << 1) + ((S >> (K + (TREEBIN_SHIFT-1)) & 1)));\ - }\ -} - -#else /* GNUC */ -#define compute_tree_index(S, I)\ -{\ - size_t X = S >> TREEBIN_SHIFT;\ - if (X == 0)\ - I = 0;\ - else if (X > 0xFFFF)\ - I = NTREEBINS-1;\ - else {\ - unsigned int Y = (unsigned int)X;\ - unsigned int N = ((Y - 0x100) >> 16) & 8;\ - unsigned int K = (((Y <<= N) - 0x1000) >> 16) & 4;\ - N += K;\ - N += K = (((Y <<= K) - 0x4000) >> 16) & 2;\ - K = 14 - N + ((Y <<= K) >> 15);\ - I = (K << 1) + ((S >> (K + (TREEBIN_SHIFT-1)) & 1));\ - }\ -} -#endif /* GNUC */ - -/* Bit representing maximum resolved size in a treebin at i */ -#define bit_for_tree_index(i) \ - (i == NTREEBINS-1)? (SIZE_T_BITSIZE-1) : (((i) >> 1) + TREEBIN_SHIFT - 2) - -/* Shift placing maximum resolved bit in a treebin at i as sign bit */ -#define leftshift_for_tree_index(i) \ - ((i == NTREEBINS-1)? 0 : \ - ((SIZE_T_BITSIZE-SIZE_T_ONE) - (((i) >> 1) + TREEBIN_SHIFT - 2))) - -/* The size of the smallest chunk held in bin with index i */ -#define minsize_for_tree_index(i) \ - ((SIZE_T_ONE << (((i) >> 1) + TREEBIN_SHIFT)) | \ - (((size_t)((i) & SIZE_T_ONE)) << (((i) >> 1) + TREEBIN_SHIFT - 1))) - - -/* ------------------------ Operations on bin maps ----------------------- */ - -/* bit corresponding to given index */ -#define idx2bit(i) ((binmap_t)(1) << (i)) - -/* Mark/Clear bits with given index */ -#define mark_smallmap(M,i) ((M)->smallmap |= idx2bit(i)) -#define clear_smallmap(M,i) ((M)->smallmap &= ~idx2bit(i)) -#define smallmap_is_marked(M,i) ((M)->smallmap & idx2bit(i)) - -#define mark_treemap(M,i) ((M)->treemap |= idx2bit(i)) -#define clear_treemap(M,i) ((M)->treemap &= ~idx2bit(i)) -#define treemap_is_marked(M,i) ((M)->treemap & idx2bit(i)) - -/* isolate the least set bit of a bitmap */ -#define least_bit(x) ((x) & -(x)) - -/* mask with all bits to left of least bit of x on */ -#define left_bits(x) ((x<<1) | -(x<<1)) - -/* mask with all bits to left of or equal to least bit of x on */ -#define same_or_left_bits(x) ((x) | -(x)) - -/* index corresponding to given bit. 
Use x86 asm if possible */
-
-#if defined(__GNUC__) && (defined(__i386__) || defined(__x86_64__))
-#define compute_bit2idx(X, I)\
-{\
-  unsigned int J;\
-  J = __builtin_ctz(X); \
-  I = (bindex_t)J;\
-}
-
-#elif defined (__INTEL_COMPILER)
-#define compute_bit2idx(X, I)\
-{\
-  unsigned int J;\
-  J = _bit_scan_forward (X); \
-  I = (bindex_t)J;\
-}
-
-#elif defined(_MSC_VER) && _MSC_VER>=1300
-#define compute_bit2idx(X, I)\
-{\
-  unsigned int J;\
-  _BitScanForward((DWORD *) &J, X);\
-  I = (bindex_t)J;\
-}
-
-#elif USE_BUILTIN_FFS
-#define compute_bit2idx(X, I) I = ffs(X)-1
-
-#else
-#define compute_bit2idx(X, I)\
-{\
-  unsigned int Y = X - 1;\
-  unsigned int K = Y >> (16-4) & 16;\
-  unsigned int N = K;        Y >>= K;\
-  N += K = Y >> (8-3) &  8;  Y >>= K;\
-  N += K = Y >> (4-2) &  4;  Y >>= K;\
-  N += K = Y >> (2-1) &  2;  Y >>= K;\
-  N += K = Y >> (1-0) &  1;  Y >>= K;\
-  I = (bindex_t)(N + Y);\
-}
-#endif /* GNUC */
-
-
-/* ----------------------- Runtime Check Support ------------------------- */
-
-/*
-  For security, the main invariant is that malloc/free/etc never
-  writes to a static address other than malloc_state, unless static
-  malloc_state itself has been corrupted, which cannot occur via
-  malloc (because of these checks). In essence this means that we
-  believe all pointers, sizes, maps etc held in malloc_state, but
-  check all of those linked or offsetted from other embedded data
-  structures.  These checks are interspersed with main code in a way
-  that tends to minimize their run-time cost.
-
-  When FOOTERS is defined, in addition to range checking, we also
-  verify footer fields of inuse chunks, which can be used to guarantee
-  that the mstate controlling malloc/free is intact.  This is a
-  streamlined version of the approach described by William Robertson
-  et al in "Run-time Detection of Heap-based Overflows" LISA'03
-  http://www.usenix.org/events/lisa03/tech/robertson.html The footer
-  of an inuse chunk holds the xor of its mstate and a random seed,
-  which is checked upon calls to free() and realloc().  This is
-  (probabilistically) unguessable from outside the program, but can be
-  computed by any code successfully malloc'ing any chunk, so does not
-  itself provide protection against code that has already broken
-  security through some other means.  Unlike Robertson et al, we
-  always dynamically check addresses of all offset chunks (previous,
-  next, etc). This turns out to be cheaper than relying on hashes.
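  The xor trick itself is a two-line round trip; a sketch, with a fixed
  stand-in for the random mparams.magic (mark_inuse_foot and
  get_mstate_for below are the real macros):

      #include <assert.h>
      #include <stddef.h>

      int main(void) {
        size_t magic = (size_t)0x5bd1e995;     // stand-in random seed
        int state;                             // stand-in for the mstate
        size_t foot = (size_t)&state ^ magic;  // what the footer stores
        assert((int *)(foot ^ magic) == &state);  // recovering the mstate
        return 0;
      }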
-*/ - -#if !INSECURE -/* Check if address a is at least as high as any from MORECORE or MMAP */ -#define ok_address(M, a) ((char*)(a) >= (M)->least_addr) -/* Check if address of next chunk n is higher than base chunk p */ -#define ok_next(p, n) ((char*)(p) < (char*)(n)) -/* Check if p has inuse status */ -#define ok_inuse(p) is_inuse(p) -/* Check if p has its pinuse bit on */ -#define ok_pinuse(p) pinuse(p) - -#else /* !INSECURE */ -#define ok_address(M, a) (1) -#define ok_next(b, n) (1) -#define ok_inuse(p) (1) -#define ok_pinuse(p) (1) -#endif /* !INSECURE */ - -#if (FOOTERS && !INSECURE) -/* Check if (alleged) mstate m has expected magic field */ -#define ok_magic(M) ((M)->magic == mparams.magic) -#else /* (FOOTERS && !INSECURE) */ -#define ok_magic(M) (1) -#endif /* (FOOTERS && !INSECURE) */ - -/* In gcc, use __builtin_expect to minimize impact of checks */ -#if !INSECURE -#if defined(__GNUC__) && __GNUC__ >= 3 -#define RTCHECK(e) __builtin_expect(e, 1) -#else /* GNUC */ -#define RTCHECK(e) (e) -#endif /* GNUC */ -#else /* !INSECURE */ -#define RTCHECK(e) (1) -#endif /* !INSECURE */ - -/* macros to set up inuse chunks with or without footers */ - -#if !FOOTERS - -#define mark_inuse_foot(M,p,s) - -/* Macros for setting head/foot of non-mmapped chunks */ - -/* Set cinuse bit and pinuse bit of next chunk */ -#define set_inuse(M,p,s)\ - ((p)->head = (((p)->head & PINUSE_BIT)|s|CINUSE_BIT),\ - ((mchunkptr)(((char*)(p)) + (s)))->head |= PINUSE_BIT) - -/* Set cinuse and pinuse of this chunk and pinuse of next chunk */ -#define set_inuse_and_pinuse(M,p,s)\ - ((p)->head = (s|PINUSE_BIT|CINUSE_BIT),\ - ((mchunkptr)(((char*)(p)) + (s)))->head |= PINUSE_BIT) - -/* Set size, cinuse and pinuse bit of this chunk */ -#define set_size_and_pinuse_of_inuse_chunk(M, p, s)\ - ((p)->head = (s|PINUSE_BIT|CINUSE_BIT)) - -#else /* FOOTERS */ - -/* Set foot of inuse chunk to be xor of mstate and seed */ -#define mark_inuse_foot(M,p,s)\ - (((mchunkptr)((char*)(p) + (s)))->prev_foot = ((size_t)(M) ^ mparams.magic)) - -#define get_mstate_for(p)\ - ((mstate)(((mchunkptr)((char*)(p) +\ - (chunksize(p))))->prev_foot ^ mparams.magic)) - -#define set_inuse(M,p,s)\ - ((p)->head = (((p)->head & PINUSE_BIT)|s|CINUSE_BIT),\ - (((mchunkptr)(((char*)(p)) + (s)))->head |= PINUSE_BIT), \ - mark_inuse_foot(M,p,s)) - -#define set_inuse_and_pinuse(M,p,s)\ - ((p)->head = (s|PINUSE_BIT|CINUSE_BIT),\ - (((mchunkptr)(((char*)(p)) + (s)))->head |= PINUSE_BIT),\ - mark_inuse_foot(M,p,s)) - -#define set_size_and_pinuse_of_inuse_chunk(M, p, s)\ - ((p)->head = (s|PINUSE_BIT|CINUSE_BIT),\ - mark_inuse_foot(M, p, s)) - -#endif /* !FOOTERS */ - -/* ---------------------------- setting mparams -------------------------- */ - -#if LOCK_AT_FORK -static void pre_fork(void) { ACQUIRE_LOCK(&(gm)->mutex); } -static void post_fork_parent(void) { RELEASE_LOCK(&(gm)->mutex); } -static void post_fork_child(void) { INITIAL_LOCK(&(gm)->mutex); } -#endif /* LOCK_AT_FORK */ - -/* Initialize mparams */ -static int init_mparams(void) { -#ifdef NEED_GLOBAL_LOCK_INIT - if (malloc_global_mutex_status <= 0) - init_malloc_global_mutex(); -#endif - - ACQUIRE_MALLOC_GLOBAL_LOCK(); - if (mparams.magic == 0) { - size_t magic; - size_t psize; - size_t gsize; - -#ifndef WIN32 - psize = malloc_getpagesize; - gsize = ((DEFAULT_GRANULARITY != 0)? DEFAULT_GRANULARITY : psize); -#else /* WIN32 */ - { - SYSTEM_INFO system_info; - GetSystemInfo(&system_info); - psize = system_info.dwPageSize; - gsize = ((DEFAULT_GRANULARITY != 0)? 
- DEFAULT_GRANULARITY : system_info.dwAllocationGranularity); - } -#endif /* WIN32 */ - - /* Sanity-check configuration: - size_t must be unsigned and as wide as pointer type. - ints must be at least 4 bytes. - alignment must be at least 8. - Alignment, min chunk size, and page size must all be powers of 2. - */ - if ((sizeof(size_t) != sizeof(char*)) || - (MAX_SIZE_T < MIN_CHUNK_SIZE) || - (sizeof(int) < 4) || - (MALLOC_ALIGNMENT < (size_t)8U) || - ((MALLOC_ALIGNMENT & (MALLOC_ALIGNMENT-SIZE_T_ONE)) != 0) || - ((MCHUNK_SIZE & (MCHUNK_SIZE-SIZE_T_ONE)) != 0) || - ((gsize & (gsize-SIZE_T_ONE)) != 0) || - ((psize & (psize-SIZE_T_ONE)) != 0)) - ABORT; - mparams.granularity = gsize; - mparams.page_size = psize; - mparams.mmap_threshold = DEFAULT_MMAP_THRESHOLD; - mparams.trim_threshold = DEFAULT_TRIM_THRESHOLD; -#if MORECORE_CONTIGUOUS - mparams.default_mflags = USE_LOCK_BIT|USE_MMAP_BIT; -#else /* MORECORE_CONTIGUOUS */ - mparams.default_mflags = USE_LOCK_BIT|USE_MMAP_BIT|USE_NONCONTIGUOUS_BIT; -#endif /* MORECORE_CONTIGUOUS */ - -#if !ONLY_MSPACES - /* Set up lock for main malloc area */ - gm->mflags = mparams.default_mflags; - (void)INITIAL_LOCK(&gm->mutex); -#endif -#if LOCK_AT_FORK - pthread_atfork(&pre_fork, &post_fork_parent, &post_fork_child); -#endif - - { -#if USE_DEV_RANDOM - int fd; - unsigned char buf[sizeof(size_t)]; - /* Try to use /dev/urandom, else fall back on using time */ - if ((fd = open("/dev/urandom", O_RDONLY)) >= 0 && - read(fd, buf, sizeof(buf)) == sizeof(buf)) { - magic = *((size_t *) buf); - close(fd); - } - else -#endif /* USE_DEV_RANDOM */ -#ifdef WIN32 - magic = (size_t)(GetTickCount() ^ (size_t)0x55555555U); -#elif defined(LACKS_TIME_H) - magic = (size_t)&magic ^ (size_t)0x55555555U; -#else - magic = (size_t)(time(0) ^ (size_t)0x55555555U); -#endif - magic |= (size_t)8U; /* ensure nonzero */ - magic &= ~(size_t)7U; /* improve chances of fault for bad values */ - /* Until memory modes commonly available, use volatile-write */ - (*(volatile size_t *)(&(mparams.magic))) = magic; - } - } - - RELEASE_MALLOC_GLOBAL_LOCK(); - return 1; -} - -/* support for mallopt */ -static int change_mparam(int param_number, int value) { - size_t val; - ensure_initialization(); - val = (value == -1)? MAX_SIZE_T : (size_t)value; - switch(param_number) { - case M_TRIM_THRESHOLD: - mparams.trim_threshold = val; - return 1; - case M_GRANULARITY: - if (val >= mparams.page_size && ((val & (val-1)) == 0)) { - mparams.granularity = val; - return 1; - } - else - return 0; - case M_MMAP_THRESHOLD: - mparams.mmap_threshold = val; - return 1; - default: - return 0; - } -} - -#if DEBUG -/* ------------------------- Debugging Support --------------------------- */ - -/* Check properties of any chunk, whether free, inuse, mmapped etc */ -static void do_check_any_chunk(mstate m, mchunkptr p) { - assert((is_aligned(chunk2mem(p))) || (p->head == FENCEPOST_HEAD)); - assert(ok_address(m, p)); -} - -/* Check properties of top chunk */ -static void do_check_top_chunk(mstate m, mchunkptr p) { - msegmentptr sp = segment_holding(m, (char*)p); - size_t sz = p->head & ~INUSE_BITS; /* third-lowest bit can be set! 
*/ - assert(sp != 0); - assert((is_aligned(chunk2mem(p))) || (p->head == FENCEPOST_HEAD)); - assert(ok_address(m, p)); - assert(sz == m->topsize); - assert(sz > 0); - assert(sz == ((sp->base + sp->size) - (char*)p) - TOP_FOOT_SIZE); - assert(pinuse(p)); - assert(!pinuse(chunk_plus_offset(p, sz))); -} - -/* Check properties of (inuse) mmapped chunks */ -static void do_check_mmapped_chunk(mstate m, mchunkptr p) { - size_t sz = chunksize(p); - size_t len = (sz + (p->prev_foot) + MMAP_FOOT_PAD); - assert(is_mmapped(p)); - assert(use_mmap(m)); - assert((is_aligned(chunk2mem(p))) || (p->head == FENCEPOST_HEAD)); - assert(ok_address(m, p)); - assert(!is_small(sz)); - assert((len & (mparams.page_size-SIZE_T_ONE)) == 0); - assert(chunk_plus_offset(p, sz)->head == FENCEPOST_HEAD); - assert(chunk_plus_offset(p, sz+SIZE_T_SIZE)->head == 0); -} - -/* Check properties of inuse chunks */ -static void do_check_inuse_chunk(mstate m, mchunkptr p) { - do_check_any_chunk(m, p); - assert(is_inuse(p)); - assert(next_pinuse(p)); - /* If not pinuse and not mmapped, previous chunk has OK offset */ - assert(is_mmapped(p) || pinuse(p) || next_chunk(prev_chunk(p)) == p); - if (is_mmapped(p)) - do_check_mmapped_chunk(m, p); -} - -/* Check properties of free chunks */ -static void do_check_free_chunk(mstate m, mchunkptr p) { - size_t sz = chunksize(p); - mchunkptr next = chunk_plus_offset(p, sz); - do_check_any_chunk(m, p); - assert(!is_inuse(p)); - assert(!next_pinuse(p)); - assert (!is_mmapped(p)); - if (p != m->dv && p != m->top) { - if (sz >= MIN_CHUNK_SIZE) { - assert((sz & CHUNK_ALIGN_MASK) == 0); - assert(is_aligned(chunk2mem(p))); - assert(next->prev_foot == sz); - assert(pinuse(p)); - assert (next == m->top || is_inuse(next)); - assert(p->fd->bk == p); - assert(p->bk->fd == p); - } - else /* markers are always of size SIZE_T_SIZE */ - assert(sz == SIZE_T_SIZE); - } -} - -/* Check properties of malloced chunks at the point they are malloced */ -static void do_check_malloced_chunk(mstate m, void* mem, size_t s) { - if (mem != 0) { - mchunkptr p = mem2chunk(mem); - size_t sz = p->head & ~INUSE_BITS; - do_check_inuse_chunk(m, p); - assert((sz & CHUNK_ALIGN_MASK) == 0); - assert(sz >= MIN_CHUNK_SIZE); - assert(sz >= s); - /* unless mmapped, size is less than MIN_CHUNK_SIZE more than request */ - assert(is_mmapped(p) || sz < (s + MIN_CHUNK_SIZE)); - } -} - -/* Check a tree and its subtrees. 
*/ -static void do_check_tree(mstate m, tchunkptr t) { - tchunkptr head = 0; - tchunkptr u = t; - bindex_t tindex = t->index; - size_t tsize = chunksize(t); - bindex_t idx; - compute_tree_index(tsize, idx); - assert(tindex == idx); - assert(tsize >= MIN_LARGE_SIZE); - assert(tsize >= minsize_for_tree_index(idx)); - assert((idx == NTREEBINS-1) || (tsize < minsize_for_tree_index((idx+1)))); - - do { /* traverse through chain of same-sized nodes */ - do_check_any_chunk(m, ((mchunkptr)u)); - assert(u->index == tindex); - assert(chunksize(u) == tsize); - assert(!is_inuse(u)); - assert(!next_pinuse(u)); - assert(u->fd->bk == u); - assert(u->bk->fd == u); - if (u->parent == 0) { - assert(u->child[0] == 0); - assert(u->child[1] == 0); - } - else { - assert(head == 0); /* only one node on chain has parent */ - head = u; - assert(u->parent != u); - assert (u->parent->child[0] == u || - u->parent->child[1] == u || - *((tbinptr*)(u->parent)) == u); - if (u->child[0] != 0) { - assert(u->child[0]->parent == u); - assert(u->child[0] != u); - do_check_tree(m, u->child[0]); - } - if (u->child[1] != 0) { - assert(u->child[1]->parent == u); - assert(u->child[1] != u); - do_check_tree(m, u->child[1]); - } - if (u->child[0] != 0 && u->child[1] != 0) { - assert(chunksize(u->child[0]) < chunksize(u->child[1])); - } - } - u = u->fd; - } while (u != t); - assert(head != 0); -} - -/* Check all the chunks in a treebin. */ -static void do_check_treebin(mstate m, bindex_t i) { - tbinptr* tb = treebin_at(m, i); - tchunkptr t = *tb; - int empty = (m->treemap & (1U << i)) == 0; - if (t == 0) - assert(empty); - if (!empty) - do_check_tree(m, t); -} - -/* Check all the chunks in a smallbin. */ -static void do_check_smallbin(mstate m, bindex_t i) { - sbinptr b = smallbin_at(m, i); - mchunkptr p = b->bk; - unsigned int empty = (m->smallmap & (1U << i)) == 0; - if (p == b) - assert(empty); - if (!empty) { - for (; p != b; p = p->bk) { - size_t size = chunksize(p); - mchunkptr q; - /* each chunk claims to be free */ - do_check_free_chunk(m, p); - /* chunk belongs in bin */ - assert(small_index(size) == i); - assert(p->bk == b || chunksize(p->bk) == chunksize(p)); - /* chunk is followed by an inuse chunk */ - q = next_chunk(p); - if (q->head != FENCEPOST_HEAD) - do_check_inuse_chunk(m, q); - } - } -} - -/* Find x in a bin. Used in other check functions. 
*/ -static int bin_find(mstate m, mchunkptr x) { - size_t size = chunksize(x); - if (is_small(size)) { - bindex_t sidx = small_index(size); - sbinptr b = smallbin_at(m, sidx); - if (smallmap_is_marked(m, sidx)) { - mchunkptr p = b; - do { - if (p == x) - return 1; - } while ((p = p->fd) != b); - } - } - else { - bindex_t tidx; - compute_tree_index(size, tidx); - if (treemap_is_marked(m, tidx)) { - tchunkptr t = *treebin_at(m, tidx); - size_t sizebits = size << leftshift_for_tree_index(tidx); - while (t != 0 && chunksize(t) != size) { - t = t->child[(sizebits >> (SIZE_T_BITSIZE-SIZE_T_ONE)) & 1]; - sizebits <<= 1; - } - if (t != 0) { - tchunkptr u = t; - do { - if (u == (tchunkptr)x) - return 1; - } while ((u = u->fd) != t); - } - } - } - return 0; -} - -/* Traverse each chunk and check it; return total */ -static size_t traverse_and_check(mstate m) { - size_t sum = 0; - if (is_initialized(m)) { - msegmentptr s = &m->seg; - sum += m->topsize + TOP_FOOT_SIZE; - while (s != 0) { - mchunkptr q = align_as_chunk(s->base); - mchunkptr lastq = 0; - assert(pinuse(q)); - while (segment_holds(s, q) && - q != m->top && q->head != FENCEPOST_HEAD) { - sum += chunksize(q); - if (is_inuse(q)) { - assert(!bin_find(m, q)); - do_check_inuse_chunk(m, q); - } - else { - assert(q == m->dv || bin_find(m, q)); - assert(lastq == 0 || is_inuse(lastq)); /* Not 2 consecutive free */ - do_check_free_chunk(m, q); - } - lastq = q; - q = next_chunk(q); - } - s = s->next; - } - } - return sum; -} - - -/* Check all properties of malloc_state. */ -static void do_check_malloc_state(mstate m) { - bindex_t i; - size_t total; - /* check bins */ - for (i = 0; i < NSMALLBINS; ++i) - do_check_smallbin(m, i); - for (i = 0; i < NTREEBINS; ++i) - do_check_treebin(m, i); - - if (m->dvsize != 0) { /* check dv chunk */ - do_check_any_chunk(m, m->dv); - assert(m->dvsize == chunksize(m->dv)); - assert(m->dvsize >= MIN_CHUNK_SIZE); - assert(bin_find(m, m->dv) == 0); - } - - if (m->top != 0) { /* check top chunk */ - do_check_top_chunk(m, m->top); - /*assert(m->topsize == chunksize(m->top)); redundant */ - assert(m->topsize > 0); - assert(bin_find(m, m->top) == 0); - } - - total = traverse_and_check(m); - assert(total <= m->footprint); - assert(m->footprint <= m->max_footprint); -} -#endif /* DEBUG */ - -/* ----------------------------- statistics ------------------------------ */ - -#if !NO_MALLINFO -static struct mallinfo internal_mallinfo(mstate m) { - struct mallinfo nm = { 0, 0, 0, 0, 0, 0, 0, 0, 0, 0 }; - ensure_initialization(); - if (!PREACTION(m)) { - check_malloc_state(m); - if (is_initialized(m)) { - size_t nfree = SIZE_T_ONE; /* top always free */ - size_t mfree = m->topsize + TOP_FOOT_SIZE; - size_t sum = mfree; - msegmentptr s = &m->seg; - while (s != 0) { - mchunkptr q = align_as_chunk(s->base); - while (segment_holds(s, q) && - q != m->top && q->head != FENCEPOST_HEAD) { - size_t sz = chunksize(q); - sum += sz; - if (!is_inuse(q)) { - mfree += sz; - ++nfree; - } - q = next_chunk(q); - } - s = s->next; - } - - nm.arena = sum; - nm.ordblks = nfree; - nm.hblkhd = m->footprint - sum; - nm.usmblks = m->max_footprint; - nm.uordblks = m->footprint - mfree; - nm.fordblks = mfree; - nm.keepcost = m->topsize; - } - - POSTACTION(m); - } - return nm; -} -#endif /* !NO_MALLINFO */ - -#if !NO_MALLOC_STATS -static void internal_malloc_stats(mstate m) { - ensure_initialization(); - if (!PREACTION(m)) { - size_t maxfp = 0; - size_t fp = 0; - size_t used = 0; - check_malloc_state(m); - if (is_initialized(m)) { - msegmentptr s = &m->seg; - 
maxfp = m->max_footprint; - fp = m->footprint; - used = fp - (m->topsize + TOP_FOOT_SIZE); - - while (s != 0) { - mchunkptr q = align_as_chunk(s->base); - while (segment_holds(s, q) && - q != m->top && q->head != FENCEPOST_HEAD) { - if (!is_inuse(q)) - used -= chunksize(q); - q = next_chunk(q); - } - s = s->next; - } - } - POSTACTION(m); /* drop lock */ - fprintf(stderr, "max system bytes = %10lu\n", (unsigned long)(maxfp)); - fprintf(stderr, "system bytes = %10lu\n", (unsigned long)(fp)); - fprintf(stderr, "in use bytes = %10lu\n", (unsigned long)(used)); - } -} -#endif /* NO_MALLOC_STATS */ - -/* ----------------------- Operations on smallbins ----------------------- */ - -/* - Various forms of linking and unlinking are defined as macros. Even - the ones for trees, which are very long but have very short typical - paths. This is ugly but reduces reliance on inlining support of - compilers. -*/ - -/* Link a free chunk into a smallbin */ -#define insert_small_chunk(M, P, S) {\ - bindex_t I = small_index(S);\ - mchunkptr B = smallbin_at(M, I);\ - mchunkptr F = B;\ - assert(S >= MIN_CHUNK_SIZE);\ - if (!smallmap_is_marked(M, I))\ - mark_smallmap(M, I);\ - else if (RTCHECK(ok_address(M, B->fd)))\ - F = B->fd;\ - else {\ - CORRUPTION_ERROR_ACTION(M);\ - }\ - B->fd = P;\ - F->bk = P;\ - P->fd = F;\ - P->bk = B;\ -} - -/* Unlink a chunk from a smallbin */ -#define unlink_small_chunk(M, P, S) {\ - mchunkptr F = P->fd;\ - mchunkptr B = P->bk;\ - bindex_t I = small_index(S);\ - assert(P != B);\ - assert(P != F);\ - assert(chunksize(P) == small_index2size(I));\ - if (RTCHECK(F == smallbin_at(M,I) || (ok_address(M, F) && F->bk == P))) { \ - if (B == F) {\ - clear_smallmap(M, I);\ - }\ - else if (RTCHECK(B == smallbin_at(M,I) ||\ - (ok_address(M, B) && B->fd == P))) {\ - F->bk = B;\ - B->fd = F;\ - }\ - else {\ - CORRUPTION_ERROR_ACTION(M);\ - }\ - }\ - else {\ - CORRUPTION_ERROR_ACTION(M);\ - }\ -} - -/* Unlink the first chunk from a smallbin */ -#define unlink_first_small_chunk(M, B, P, I) {\ - mchunkptr F = P->fd;\ - assert(P != B);\ - assert(P != F);\ - assert(chunksize(P) == small_index2size(I));\ - if (B == F) {\ - clear_smallmap(M, I);\ - }\ - else if (RTCHECK(ok_address(M, F) && F->bk == P)) {\ - F->bk = B;\ - B->fd = F;\ - }\ - else {\ - CORRUPTION_ERROR_ACTION(M);\ - }\ -} - -/* Replace dv node, binning the old one */ -/* Used only when dvsize known to be small */ -#define replace_dv(M, P, S) {\ - size_t DVS = M->dvsize;\ - assert(is_small(DVS));\ - if (DVS != 0) {\ - mchunkptr DV = M->dv;\ - insert_small_chunk(M, DV, DVS);\ - }\ - M->dvsize = S;\ - M->dv = P;\ -} - -/* ------------------------- Operations on trees ------------------------- */ - -/* Insert chunk into tree */ -#define insert_large_chunk(M, X, S) {\ - tbinptr* H;\ - bindex_t I;\ - compute_tree_index(S, I);\ - H = treebin_at(M, I);\ - X->index = I;\ - X->child[0] = X->child[1] = 0;\ - if (!treemap_is_marked(M, I)) {\ - mark_treemap(M, I);\ - *H = X;\ - X->parent = (tchunkptr)H;\ - X->fd = X->bk = X;\ - }\ - else {\ - tchunkptr T = *H;\ - size_t K = S << leftshift_for_tree_index(I);\ - for (;;) {\ - if (chunksize(T) != S) {\ - tchunkptr* C = &(T->child[(K >> (SIZE_T_BITSIZE-SIZE_T_ONE)) & 1]);\ - K <<= 1;\ - if (*C != 0)\ - T = *C;\ - else if (RTCHECK(ok_address(M, C))) {\ - *C = X;\ - X->parent = T;\ - X->fd = X->bk = X;\ - break;\ - }\ - else {\ - CORRUPTION_ERROR_ACTION(M);\ - break;\ - }\ - }\ - else {\ - tchunkptr F = T->fd;\ - if (RTCHECK(ok_address(M, T) && ok_address(M, F))) {\ - T->fd = F->bk = X;\ - X->fd = F;\ - X->bk 
= T;\ - X->parent = 0;\ - break;\ - }\ - else {\ - CORRUPTION_ERROR_ACTION(M);\ - break;\ - }\ - }\ - }\ - }\ -} - -/* - Unlink steps: - - 1. If x is a chained node, unlink it from its same-sized fd/bk links - and choose its bk node as its replacement. - 2. If x was the last node of its size, but not a leaf node, it must - be replaced with a leaf node (not merely one with an open left or - right), to make sure that lefts and rights of descendents - correspond properly to bit masks. We use the rightmost descendent - of x. We could use any other leaf, but this is easy to locate and - tends to counteract removal of leftmosts elsewhere, and so keeps - paths shorter than minimally guaranteed. This doesn't loop much - because on average a node in a tree is near the bottom. - 3. If x is the base of a chain (i.e., has parent links) relink - x's parent and children to x's replacement (or null if none). -*/ - -#define unlink_large_chunk(M, X) {\ - tchunkptr XP = X->parent;\ - tchunkptr R;\ - if (X->bk != X) {\ - tchunkptr F = X->fd;\ - R = X->bk;\ - if (RTCHECK(ok_address(M, F) && F->bk == X && R->fd == X)) {\ - F->bk = R;\ - R->fd = F;\ - }\ - else {\ - CORRUPTION_ERROR_ACTION(M);\ - }\ - }\ - else {\ - tchunkptr* RP;\ - if (((R = *(RP = &(X->child[1]))) != 0) ||\ - ((R = *(RP = &(X->child[0]))) != 0)) {\ - tchunkptr* CP;\ - while ((*(CP = &(R->child[1])) != 0) ||\ - (*(CP = &(R->child[0])) != 0)) {\ - R = *(RP = CP);\ - }\ - if (RTCHECK(ok_address(M, RP)))\ - *RP = 0;\ - else {\ - CORRUPTION_ERROR_ACTION(M);\ - }\ - }\ - }\ - if (XP != 0) {\ - tbinptr* H = treebin_at(M, X->index);\ - if (X == *H) {\ - if ((*H = R) == 0) \ - clear_treemap(M, X->index);\ - }\ - else if (RTCHECK(ok_address(M, XP))) {\ - if (XP->child[0] == X) \ - XP->child[0] = R;\ - else \ - XP->child[1] = R;\ - }\ - else\ - CORRUPTION_ERROR_ACTION(M);\ - if (R != 0) {\ - if (RTCHECK(ok_address(M, R))) {\ - tchunkptr C0, C1;\ - R->parent = XP;\ - if ((C0 = X->child[0]) != 0) {\ - if (RTCHECK(ok_address(M, C0))) {\ - R->child[0] = C0;\ - C0->parent = R;\ - }\ - else\ - CORRUPTION_ERROR_ACTION(M);\ - }\ - if ((C1 = X->child[1]) != 0) {\ - if (RTCHECK(ok_address(M, C1))) {\ - R->child[1] = C1;\ - C1->parent = R;\ - }\ - else\ - CORRUPTION_ERROR_ACTION(M);\ - }\ - }\ - else\ - CORRUPTION_ERROR_ACTION(M);\ - }\ - }\ -} - -/* Relays to large vs small bin operations */ - -#define insert_chunk(M, P, S)\ - if (is_small(S)) insert_small_chunk(M, P, S)\ - else { tchunkptr TP = (tchunkptr)(P); insert_large_chunk(M, TP, S); } - -#define unlink_chunk(M, P, S)\ - if (is_small(S)) unlink_small_chunk(M, P, S)\ - else { tchunkptr TP = (tchunkptr)(P); unlink_large_chunk(M, TP); } - - -/* Relays to internal calls to malloc/free from realloc, memalign etc */ - -#if ONLY_MSPACES -#define internal_malloc(m, b) mspace_malloc(m, b) -#define internal_free(m, mem) mspace_free(m,mem); -#else /* ONLY_MSPACES */ -#if MSPACES -#define internal_malloc(m, b)\ - ((m == gm)? dlmalloc(b) : mspace_malloc(m, b)) -#define internal_free(m, mem)\ - if (m == gm) dlfree(mem); else mspace_free(m,mem); -#else /* MSPACES */ -#define internal_malloc(m, b) dlmalloc(b) -#define internal_free(m, mem) dlfree(mem) -#endif /* MSPACES */ -#endif /* ONLY_MSPACES */ - -/* ----------------------- Direct-mmapping chunks ----------------------- */ - -/* - Directly mmapped chunks are set up with an offset to the start of - the mmapped region stored in the prev_foot field of the chunk. 
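A self-contained sketch of this prev_foot offset trick may help before the comment continues; it assumes POSIX mmap with MAP_ANONYMOUS and a hypothetical fixed 16-byte alignment, and it omits the fenceposts and flag bits real chunks carry:

#include <stddef.h>
#include <stdint.h>
#include <sys/mman.h>

#define ALIGN ((uintptr_t)16)

/* Map extra space, park the payload on an ALIGN boundary, and stash the
   mapping length plus the offset back to the raw base just below it. */
static void *aligned_map(size_t len) {
  size_t total = len + ALIGN + 2 * sizeof(size_t);
  char *base = mmap(0, total, PROT_READ | PROT_WRITE,
                    MAP_PRIVATE | MAP_ANONYMOUS, -1, 0);
  if (base == MAP_FAILED)
    return 0;
  uintptr_t raw = (uintptr_t)base + 2 * sizeof(size_t);
  uintptr_t mem = (raw + (ALIGN - 1)) & ~(ALIGN - 1);
  ((size_t *)mem)[-1] = total;                 /* length for munmap */
  ((size_t *)mem)[-2] = mem - (uintptr_t)base; /* offset to raw base */
  return (void *)mem;
}

/* Rebuild the exact munmap(base, length) pair from the stashed fields,
   the way free handles chunks flagged as directly mmapped. */
static void aligned_unmap(void *mem) {
  size_t total = ((size_t *)mem)[-1];
  size_t offset = ((size_t *)mem)[-2];
  munmap((char *)mem - offset, total);
}

int main(void) {
  void *p = aligned_map(1000);
  if (p)
    aligned_unmap(p);
  return 0;
}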
This - allows reconstruction of the required argument to MUNMAP when freed, - and also allows adjustment of the returned chunk to meet alignment - requirements (especially in memalign). -*/ - -/* Malloc using mmap */ -static void* mmap_alloc(mstate m, size_t nb) { - size_t mmsize = mmap_align(nb + SIX_SIZE_T_SIZES + CHUNK_ALIGN_MASK); - if (m->footprint_limit != 0) { - size_t fp = m->footprint + mmsize; - if (fp <= m->footprint || fp > m->footprint_limit) - return 0; - } - if (mmsize > nb) { /* Check for wrap around 0 */ - char* mm = (char*)(CALL_DIRECT_MMAP(mmsize)); - if (mm != CMFAIL) { - size_t offset = align_offset(chunk2mem(mm)); - size_t psize = mmsize - offset - MMAP_FOOT_PAD; - mchunkptr p = (mchunkptr)(mm + offset); - p->prev_foot = offset; - p->head = psize; - mark_inuse_foot(m, p, psize); - chunk_plus_offset(p, psize)->head = FENCEPOST_HEAD; - chunk_plus_offset(p, psize+SIZE_T_SIZE)->head = 0; - - if (m->least_addr == 0 || mm < m->least_addr) - m->least_addr = mm; - if ((m->footprint += mmsize) > m->max_footprint) - m->max_footprint = m->footprint; - assert(is_aligned(chunk2mem(p))); - check_mmapped_chunk(m, p); - return chunk2mem(p); - } - } - return 0; -} - -/* Realloc using mmap */ -static mchunkptr mmap_resize(mstate m, mchunkptr oldp, size_t nb, int flags) { - size_t oldsize = chunksize(oldp); - (void)flags; /* placate people compiling -Wunused */ - if (is_small(nb)) /* Can't shrink mmap regions below small size */ - return 0; - /* Keep old chunk if big enough but not too big */ - if (oldsize >= nb + SIZE_T_SIZE && - (oldsize - nb) <= (mparams.granularity << 1)) - return oldp; - else { - size_t offset = oldp->prev_foot; - size_t oldmmsize = oldsize + offset + MMAP_FOOT_PAD; - size_t newmmsize = mmap_align(nb + SIX_SIZE_T_SIZES + CHUNK_ALIGN_MASK); - char* cp = (char*)CALL_MREMAP((char*)oldp - offset, - oldmmsize, newmmsize, flags); - if (cp != CMFAIL) { - mchunkptr newp = (mchunkptr)(cp + offset); - size_t psize = newmmsize - offset - MMAP_FOOT_PAD; - newp->head = psize; - mark_inuse_foot(m, newp, psize); - chunk_plus_offset(newp, psize)->head = FENCEPOST_HEAD; - chunk_plus_offset(newp, psize+SIZE_T_SIZE)->head = 0; - - if (cp < m->least_addr) - m->least_addr = cp; - if ((m->footprint += newmmsize - oldmmsize) > m->max_footprint) - m->max_footprint = m->footprint; - check_mmapped_chunk(m, newp); - return newp; - } - } - return 0; -} - - -/* -------------------------- mspace management -------------------------- */ - -/* Initialize top chunk and its size */ -static void init_top(mstate m, mchunkptr p, size_t psize) { - /* Ensure alignment */ - size_t offset = align_offset(chunk2mem(p)); - p = (mchunkptr)((char*)p + offset); - psize -= offset; - - m->top = p; - m->topsize = psize; - p->head = psize | PINUSE_BIT; - /* set size of fake trailing chunk holding overhead space only once */ - chunk_plus_offset(p, psize)->head = TOP_FOOT_SIZE; - m->trim_check = mparams.trim_threshold; /* reset on each update */ -} - -/* Initialize bins for a new mstate that is otherwise zeroed out */ -static void init_bins(mstate m) { - /* Establish circular links for smallbins */ - bindex_t i; - for (i = 0; i < NSMALLBINS; ++i) { - sbinptr bin = smallbin_at(m,i); - bin->fd = bin->bk = bin; - } -} - -#if PROCEED_ON_ERROR - -/* default corruption action */ -static void reset_on_error(mstate m) { - int i; - ++malloc_corruption_error_count; - /* Reinitialize fields to forget about all memory */ - m->smallmap = m->treemap = 0; - m->dvsize = m->topsize = 0; - m->seg.base = 0; - m->seg.size = 0; - 
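The circular smallbin setup in init_bins above deserves a tiny standalone illustration; the stripped-down node type is hypothetical. Because each empty bin header points at itself, emptiness is a single pointer comparison and insertion never needs null checks:

#include <assert.h>

struct bin { struct bin *fd, *bk; };

int main(void) {
  struct bin bins[32];
  for (int i = 0; i < 32; ++i)
    bins[i].fd = bins[i].bk = &bins[i];  /* self-linked means empty */
  assert(bins[7].fd == &bins[7]);        /* bin 7 holds no chunks */
  return 0;
}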
m->seg.next = 0; - m->top = m->dv = 0; - for (i = 0; i < NTREEBINS; ++i) - *treebin_at(m, i) = 0; - init_bins(m); -} -#endif /* PROCEED_ON_ERROR */ - -/* Allocate chunk and prepend remainder with chunk in successor base. */ -static void* prepend_alloc(mstate m, char* newbase, char* oldbase, - size_t nb) { - mchunkptr p = align_as_chunk(newbase); - mchunkptr oldfirst = align_as_chunk(oldbase); - size_t psize = (char*)oldfirst - (char*)p; - mchunkptr q = chunk_plus_offset(p, nb); - size_t qsize = psize - nb; - set_size_and_pinuse_of_inuse_chunk(m, p, nb); - - assert((char*)oldfirst > (char*)q); - assert(pinuse(oldfirst)); - assert(qsize >= MIN_CHUNK_SIZE); - - /* consolidate remainder with first chunk of old base */ - if (oldfirst == m->top) { - size_t tsize = m->topsize += qsize; - m->top = q; - q->head = tsize | PINUSE_BIT; - check_top_chunk(m, q); - } - else if (oldfirst == m->dv) { - size_t dsize = m->dvsize += qsize; - m->dv = q; - set_size_and_pinuse_of_free_chunk(q, dsize); - } - else { - if (!is_inuse(oldfirst)) { - size_t nsize = chunksize(oldfirst); - unlink_chunk(m, oldfirst, nsize); - oldfirst = chunk_plus_offset(oldfirst, nsize); - qsize += nsize; - } - set_free_with_pinuse(q, qsize, oldfirst); - insert_chunk(m, q, qsize); - check_free_chunk(m, q); - } - - check_malloced_chunk(m, chunk2mem(p), nb); - return chunk2mem(p); -} - -/* Add a segment to hold a new noncontiguous region */ -static void add_segment(mstate m, char* tbase, size_t tsize, flag_t mmapped) { - /* Determine locations and sizes of segment, fenceposts, old top */ - char* old_top = (char*)m->top; - msegmentptr oldsp = segment_holding(m, old_top); - char* old_end = oldsp->base + oldsp->size; - size_t ssize = pad_request(sizeof(struct malloc_segment)); - char* rawsp = old_end - (ssize + FOUR_SIZE_T_SIZES + CHUNK_ALIGN_MASK); - size_t offset = align_offset(chunk2mem(rawsp)); - char* asp = rawsp + offset; - char* csp = (asp < (old_top + MIN_CHUNK_SIZE))? 
old_top : asp; - mchunkptr sp = (mchunkptr)csp; - msegmentptr ss = (msegmentptr)(chunk2mem(sp)); - mchunkptr tnext = chunk_plus_offset(sp, ssize); - mchunkptr p = tnext; - int nfences = 0; - - /* reset top to new space */ - init_top(m, (mchunkptr)tbase, tsize - TOP_FOOT_SIZE); - - /* Set up segment record */ - assert(is_aligned(ss)); - set_size_and_pinuse_of_inuse_chunk(m, sp, ssize); - *ss = m->seg; /* Push current record */ - m->seg.base = tbase; - m->seg.size = tsize; - m->seg.sflags = mmapped; - m->seg.next = ss; - - /* Insert trailing fenceposts */ - for (;;) { - mchunkptr nextp = chunk_plus_offset(p, SIZE_T_SIZE); - p->head = FENCEPOST_HEAD; - ++nfences; - if ((char*)(&(nextp->head)) < old_end) - p = nextp; - else - break; - } - assert(nfences >= 2); - - /* Insert the rest of old top into a bin as an ordinary free chunk */ - if (csp != old_top) { - mchunkptr q = (mchunkptr)old_top; - size_t psize = csp - old_top; - mchunkptr tn = chunk_plus_offset(q, psize); - set_free_with_pinuse(q, psize, tn); - insert_chunk(m, q, psize); - } - - check_top_chunk(m, m->top); -} - -/* -------------------------- System allocation -------------------------- */ - -/* Get memory from system using MORECORE or MMAP */ -static void* sys_alloc(mstate m, size_t nb) { - char* tbase = CMFAIL; - size_t tsize = 0; - flag_t mmap_flag = 0; - size_t asize; /* allocation size */ - - ensure_initialization(); - - /* Directly map large chunks, but only if already initialized */ - if (use_mmap(m) && nb >= mparams.mmap_threshold && m->topsize != 0) { - void* mem = mmap_alloc(m, nb); - if (mem != 0) - return mem; - } - - asize = granularity_align(nb + SYS_ALLOC_PADDING); - if (asize <= nb) - return 0; /* wraparound */ - if (m->footprint_limit != 0) { - size_t fp = m->footprint + asize; - if (fp <= m->footprint || fp > m->footprint_limit) - return 0; - } - - /* - Try getting memory in any of three ways (in most-preferred to - least-preferred order): - 1. A call to MORECORE that can normally contiguously extend memory. - (disabled if not MORECORE_CONTIGUOUS or not HAVE_MORECORE - or main space is mmapped or a previous contiguous call failed) - 2. A call to MMAP new space (disabled if not HAVE_MMAP). - Note that under the default settings, if MORECORE is unable to - fulfill a request, and HAVE_MMAP is true, then mmap is - used as a noncontiguous system allocator. This is a useful backup - strategy for systems with holes in address spaces -- in this case - sbrk cannot contiguously expand the heap, but mmap may be able to - find space. - 3. A call to MORECORE that cannot usually contiguously extend memory. - (disabled if not HAVE_MORECORE) - - In all cases, we need to request enough bytes from system to ensure - we can malloc nb bytes upon success, so pad with enough space for - top_foot, plus alignment-pad to make sure we don't lose bytes if - not on boundary, and round this up to a granularity unit. - */ - - if (MORECORE_CONTIGUOUS && !use_noncontiguous(m)) { - char* br = CMFAIL; - size_t ssize = asize; /* sbrk call size */ - msegmentptr ss = (m->top == 0)? 
0 : segment_holding(m, (char*)m->top); - ACQUIRE_MALLOC_GLOBAL_LOCK(); - - if (ss == 0) { /* First time through or recovery */ - char* base = (char*)CALL_MORECORE(0); - if (base != CMFAIL) { - size_t fp; - /* Adjust to end on a page boundary */ - if (!is_page_aligned(base)) - ssize += (page_align((size_t)base) - (size_t)base); - fp = m->footprint + ssize; /* recheck limits */ - if (ssize > nb && ssize < HALF_MAX_SIZE_T && - (m->footprint_limit == 0 || - (fp > m->footprint && fp <= m->footprint_limit)) && - (br = (char*)(CALL_MORECORE(ssize))) == base) { - tbase = base; - tsize = ssize; - } - } - } - else { - /* Subtract out existing available top space from MORECORE request. */ - ssize = granularity_align(nb - m->topsize + SYS_ALLOC_PADDING); - /* Use mem here only if it did continuously extend old space */ - if (ssize < HALF_MAX_SIZE_T && - (br = (char*)(CALL_MORECORE(ssize))) == ss->base+ss->size) { - tbase = br; - tsize = ssize; - } - } - - if (tbase == CMFAIL) { /* Cope with partial failure */ - if (br != CMFAIL) { /* Try to use/extend the space we did get */ - if (ssize < HALF_MAX_SIZE_T && - ssize < nb + SYS_ALLOC_PADDING) { - size_t esize = granularity_align(nb + SYS_ALLOC_PADDING - ssize); - if (esize < HALF_MAX_SIZE_T) { - char* end = (char*)CALL_MORECORE(esize); - if (end != CMFAIL) - ssize += esize; - else { /* Can't use; try to release */ - (void) CALL_MORECORE(-ssize); - br = CMFAIL; - } - } - } - } - if (br != CMFAIL) { /* Use the space we did get */ - tbase = br; - tsize = ssize; - } - else - disable_contiguous(m); /* Don't try contiguous path in the future */ - } - - RELEASE_MALLOC_GLOBAL_LOCK(); - } - - if (HAVE_MMAP && tbase == CMFAIL) { /* Try MMAP */ - char* mp = (char*)(CALL_MMAP(asize)); - if (mp != CMFAIL) { - tbase = mp; - tsize = asize; - mmap_flag = USE_MMAP_BIT; - } - } - - if (HAVE_MORECORE && tbase == CMFAIL) { /* Try noncontiguous MORECORE */ - if (asize < HALF_MAX_SIZE_T) { - char* br = CMFAIL; - char* end = CMFAIL; - ACQUIRE_MALLOC_GLOBAL_LOCK(); - br = (char*)(CALL_MORECORE(asize)); - end = (char*)(CALL_MORECORE(0)); - RELEASE_MALLOC_GLOBAL_LOCK(); - if (br != CMFAIL && end != CMFAIL && br < end) { - size_t ssize = end - br; - if (ssize > nb + TOP_FOOT_SIZE) { - tbase = br; - tsize = ssize; - } - } - } - } - - if (tbase != CMFAIL) { - - if ((m->footprint += tsize) > m->max_footprint) - m->max_footprint = m->footprint; - - if (!is_initialized(m)) { /* first-time initialization */ - if (m->least_addr == 0 || tbase < m->least_addr) - m->least_addr = tbase; - m->seg.base = tbase; - m->seg.size = tsize; - m->seg.sflags = mmap_flag; - m->magic = mparams.magic; - m->release_checks = MAX_RELEASE_CHECK_RATE; - init_bins(m); -#if !ONLY_MSPACES - if (is_global(m)) - init_top(m, (mchunkptr)tbase, tsize - TOP_FOOT_SIZE); - else -#endif - { - /* Offset top by embedded malloc_state */ - mchunkptr mn = next_chunk(mem2chunk(m)); - init_top(m, mn, (size_t)((tbase + tsize) - (char*)mn) -TOP_FOOT_SIZE); - } - } - - else { - /* Try to merge with an existing segment */ - msegmentptr sp = &m->seg; - /* Only consider most recent segment if traversal suppressed */ - while (sp != 0 && tbase != sp->base + sp->size) - sp = (NO_SEGMENT_TRAVERSAL) ? 
0 : sp->next; - if (sp != 0 && - !is_extern_segment(sp) && - (sp->sflags & USE_MMAP_BIT) == mmap_flag && - segment_holds(sp, m->top)) { /* append */ - sp->size += tsize; - init_top(m, m->top, m->topsize + tsize); - } - else { - if (tbase < m->least_addr) - m->least_addr = tbase; - sp = &m->seg; - while (sp != 0 && sp->base != tbase + tsize) - sp = (NO_SEGMENT_TRAVERSAL) ? 0 : sp->next; - if (sp != 0 && - !is_extern_segment(sp) && - (sp->sflags & USE_MMAP_BIT) == mmap_flag) { - char* oldbase = sp->base; - sp->base = tbase; - sp->size += tsize; - return prepend_alloc(m, tbase, oldbase, nb); - } - else - add_segment(m, tbase, tsize, mmap_flag); - } - } - - if (nb < m->topsize) { /* Allocate from new or extended top space */ - size_t rsize = m->topsize -= nb; - mchunkptr p = m->top; - mchunkptr r = m->top = chunk_plus_offset(p, nb); - r->head = rsize | PINUSE_BIT; - set_size_and_pinuse_of_inuse_chunk(m, p, nb); - check_top_chunk(m, m->top); - check_malloced_chunk(m, chunk2mem(p), nb); - return chunk2mem(p); - } - } - - MALLOC_FAILURE_ACTION; - return 0; -} - -/* ----------------------- system deallocation -------------------------- */ - -/* Unmap and unlink any mmapped segments that don't contain used chunks */ -static size_t release_unused_segments(mstate m) { - size_t released = 0; - int nsegs = 0; - msegmentptr pred = &m->seg; - msegmentptr sp = pred->next; - while (sp != 0) { - char* base = sp->base; - size_t size = sp->size; - msegmentptr next = sp->next; - ++nsegs; - if (is_mmapped_segment(sp) && !is_extern_segment(sp)) { - mchunkptr p = align_as_chunk(base); - size_t psize = chunksize(p); - /* Can unmap if first chunk holds entire segment and not pinned */ - if (!is_inuse(p) && (char*)p + psize >= base + size - TOP_FOOT_SIZE) { - tchunkptr tp = (tchunkptr)p; - assert(segment_holds(sp, (char*)sp)); - if (p == m->dv) { - m->dv = 0; - m->dvsize = 0; - } - else { - unlink_large_chunk(m, tp); - } - if (CALL_MUNMAP(base, size) == 0) { - released += size; - m->footprint -= size; - /* unlink obsoleted record */ - sp = pred; - sp->next = next; - } - else { /* back out if cannot unmap */ - insert_large_chunk(m, tp, psize); - } - } - } - if (NO_SEGMENT_TRAVERSAL) /* scan only first segment */ - break; - pred = sp; - sp = next; - } - /* Reset check counter */ - m->release_checks = (((size_t) nsegs > (size_t) MAX_RELEASE_CHECK_RATE)? 
- (size_t) nsegs : (size_t) MAX_RELEASE_CHECK_RATE); - return released; -} - -static int sys_trim(mstate m, size_t pad) { - size_t released = 0; - ensure_initialization(); - if (pad < MAX_REQUEST && is_initialized(m)) { - pad += TOP_FOOT_SIZE; /* ensure enough room for segment overhead */ - - if (m->topsize > pad) { - /* Shrink top space in granularity-size units, keeping at least one */ - size_t unit = mparams.granularity; - size_t extra = ((m->topsize - pad + (unit - SIZE_T_ONE)) / unit - - SIZE_T_ONE) * unit; - msegmentptr sp = segment_holding(m, (char*)m->top); - - if (!is_extern_segment(sp)) { - if (is_mmapped_segment(sp)) { - if (HAVE_MMAP && - sp->size >= extra && - !has_segment_link(m, sp)) { /* can't shrink if pinned */ - size_t newsize = sp->size - extra; - (void)newsize; /* placate people compiling -Wunused-variable */ - /* Prefer mremap, fall back to munmap */ - if ((CALL_MREMAP(sp->base, sp->size, newsize, 0) != MFAIL) || - (CALL_MUNMAP(sp->base + newsize, extra) == 0)) { - released = extra; - } - } - } - else if (HAVE_MORECORE) { - if (extra >= HALF_MAX_SIZE_T) /* Avoid wrapping negative */ - extra = (HALF_MAX_SIZE_T) + SIZE_T_ONE - unit; - ACQUIRE_MALLOC_GLOBAL_LOCK(); - { - /* Make sure end of memory is where we last set it. */ - char* old_br = (char*)(CALL_MORECORE(0)); - if (old_br == sp->base + sp->size) { - char* rel_br = (char*)(CALL_MORECORE(-extra)); - char* new_br = (char*)(CALL_MORECORE(0)); - if (rel_br != CMFAIL && new_br < old_br) - released = old_br - new_br; - } - } - RELEASE_MALLOC_GLOBAL_LOCK(); - } - } - - if (released != 0) { - sp->size -= released; - m->footprint -= released; - init_top(m, m->top, m->topsize - released); - check_top_chunk(m, m->top); - } - } - - /* Unmap any unused mmapped segments */ - if (HAVE_MMAP) - released += release_unused_segments(m); - - /* On failure, disable autotrim to avoid repeated failed future calls */ - if (released == 0 && m->topsize > m->trim_check) - m->trim_check = MAX_SIZE_T; - } - - return (released != 0)? 1 : 0; -} - -/* Consolidate and bin a chunk. Differs from exported versions - of free mainly in that the chunk need not be marked as inuse. 
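To make the sys_trim arithmetic above concrete, here is a worked example with illustrative numbers only; a 64 KiB granularity is common but configuration-dependent:

#include <stddef.h>
#include <stdio.h>

int main(void) {
  size_t unit = 65536;     /* hypothetical mparams.granularity */
  size_t topsize = 300000; /* hypothetical current top size */
  size_t pad = 4096;       /* pad, here assumed to include the overhead */

  if (topsize > pad) {
    /* round the excess up to whole units, then keep one unit resident */
    size_t extra = ((topsize - pad + (unit - 1)) / unit - 1) * unit;
    printf("release %zu, top keeps %zu\n", extra, topsize - extra);
    /* prints: release 262144, top keeps 37856 */
  }
  return 0;
}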
-*/ -static void dispose_chunk(mstate m, mchunkptr p, size_t psize) { - mchunkptr next = chunk_plus_offset(p, psize); - if (!pinuse(p)) { - mchunkptr prev; - size_t prevsize = p->prev_foot; - if (is_mmapped(p)) { - psize += prevsize + MMAP_FOOT_PAD; - if (CALL_MUNMAP((char*)p - prevsize, psize) == 0) - m->footprint -= psize; - return; - } - prev = chunk_minus_offset(p, prevsize); - psize += prevsize; - p = prev; - if (RTCHECK(ok_address(m, prev))) { /* consolidate backward */ - if (p != m->dv) { - unlink_chunk(m, p, prevsize); - } - else if ((next->head & INUSE_BITS) == INUSE_BITS) { - m->dvsize = psize; - set_free_with_pinuse(p, psize, next); - return; - } - } - else { - CORRUPTION_ERROR_ACTION(m); - return; - } - } - if (RTCHECK(ok_address(m, next))) { - if (!cinuse(next)) { /* consolidate forward */ - if (next == m->top) { - size_t tsize = m->topsize += psize; - m->top = p; - p->head = tsize | PINUSE_BIT; - if (p == m->dv) { - m->dv = 0; - m->dvsize = 0; - } - return; - } - else if (next == m->dv) { - size_t dsize = m->dvsize += psize; - m->dv = p; - set_size_and_pinuse_of_free_chunk(p, dsize); - return; - } - else { - size_t nsize = chunksize(next); - psize += nsize; - unlink_chunk(m, next, nsize); - set_size_and_pinuse_of_free_chunk(p, psize); - if (p == m->dv) { - m->dvsize = psize; - return; - } - } - } - else { - set_free_with_pinuse(p, psize, next); - } - insert_chunk(m, p, psize); - } - else { - CORRUPTION_ERROR_ACTION(m); - } -} - -/* ---------------------------- malloc --------------------------- */ - -/* allocate a large request from the best fitting chunk in a treebin */ -static void* tmalloc_large(mstate m, size_t nb) { - tchunkptr v = 0; - size_t rsize = -nb; /* Unsigned negation */ - tchunkptr t; - bindex_t idx; - compute_tree_index(nb, idx); - if ((t = *treebin_at(m, idx)) != 0) { - /* Traverse tree for this bin looking for node with size == nb */ - size_t sizebits = nb << leftshift_for_tree_index(idx); - tchunkptr rst = 0; /* The deepest untaken right subtree */ - for (;;) { - tchunkptr rt; - size_t trem = chunksize(t) - nb; - if (trem < rsize) { - v = t; - if ((rsize = trem) == 0) - break; - } - rt = t->child[1]; - t = t->child[(sizebits >> (SIZE_T_BITSIZE-SIZE_T_ONE)) & 1]; - if (rt != 0 && rt != t) - rst = rt; - if (t == 0) { - t = rst; /* set t to least subtree holding sizes > nb */ - break; - } - sizebits <<= 1; - } - } - if (t == 0 && v == 0) { /* set t to root of next non-empty treebin */ - binmap_t leftbits = left_bits(idx2bit(idx)) & m->treemap; - if (leftbits != 0) { - bindex_t i; - binmap_t leastbit = least_bit(leftbits); - compute_bit2idx(leastbit, i); - t = *treebin_at(m, i); - } - } - - while (t != 0) { /* find smallest of tree or subtree */ - size_t trem = chunksize(t) - nb; - if (trem < rsize) { - rsize = trem; - v = t; - } - t = leftmost_child(t); - } - - /* If dv is a better fit, return 0 so malloc will use it */ - if (v != 0 && rsize < (size_t)(m->dvsize - nb)) { - if (RTCHECK(ok_address(m, v))) { /* split */ - mchunkptr r = chunk_plus_offset(v, nb); - assert(chunksize(v) == rsize + nb); - if (RTCHECK(ok_next(v, r))) { - unlink_large_chunk(m, v); - if (rsize < MIN_CHUNK_SIZE) - set_inuse_and_pinuse(m, v, (rsize + nb)); - else { - set_size_and_pinuse_of_inuse_chunk(m, v, nb); - set_size_and_pinuse_of_free_chunk(r, rsize); - insert_chunk(m, r, rsize); - } - return chunk2mem(v); - } - } - CORRUPTION_ERROR_ACTION(m); - } - return 0; -} - -/* allocate a small request from the best fitting chunk in a treebin */ -static void* tmalloc_small(mstate m, size_t 
nb) { - tchunkptr t, v; - size_t rsize; - bindex_t i; - binmap_t leastbit = least_bit(m->treemap); - compute_bit2idx(leastbit, i); - v = t = *treebin_at(m, i); - rsize = chunksize(t) - nb; - - while ((t = leftmost_child(t)) != 0) { - size_t trem = chunksize(t) - nb; - if (trem < rsize) { - rsize = trem; - v = t; - } - } - - if (RTCHECK(ok_address(m, v))) { - mchunkptr r = chunk_plus_offset(v, nb); - assert(chunksize(v) == rsize + nb); - if (RTCHECK(ok_next(v, r))) { - unlink_large_chunk(m, v); - if (rsize < MIN_CHUNK_SIZE) - set_inuse_and_pinuse(m, v, (rsize + nb)); - else { - set_size_and_pinuse_of_inuse_chunk(m, v, nb); - set_size_and_pinuse_of_free_chunk(r, rsize); - replace_dv(m, r, rsize); - } - return chunk2mem(v); - } - } - - CORRUPTION_ERROR_ACTION(m); - return 0; -} - -#if !ONLY_MSPACES - -void* dlmalloc(size_t bytes) { - /* - Basic algorithm: - If a small request (< 256 bytes minus per-chunk overhead): - 1. If one exists, use a remainderless chunk in associated smallbin. - (Remainderless means that there are too few excess bytes to - represent as a chunk.) - 2. If it is big enough, use the dv chunk, which is normally the - chunk adjacent to the one used for the most recent small request. - 3. If one exists, split the smallest available chunk in a bin, - saving remainder in dv. - 4. If it is big enough, use the top chunk. - 5. If available, get memory from system and use it - Otherwise, for a large request: - 1. Find the smallest available binned chunk that fits, and use it - if it is better fitting than dv chunk, splitting if necessary. - 2. If better fitting than any binned chunk, use the dv chunk. - 3. If it is big enough, use the top chunk. - 4. If request size >= mmap threshold, try to directly mmap this chunk. - 5. If available, get memory from system and use it - - The ugly goto's here ensure that postaction occurs along all paths. - */ - -#if USE_LOCKS - ensure_initialization(); /* initialize in sys_alloc if not using locks */ -#endif - - if (!PREACTION(gm)) { - void* mem; - size_t nb; - if (bytes <= MAX_SMALL_REQUEST) { - bindex_t idx; - binmap_t smallbits; - nb = (bytes < MIN_REQUEST)? MIN_CHUNK_SIZE : pad_request(bytes); - idx = small_index(nb); - smallbits = gm->smallmap >> idx; - - if ((smallbits & 0x3U) != 0) { /* Remainderless fit to a smallbin. 
*/ - mchunkptr b, p; - idx += ~smallbits & 1; /* Uses next bin if idx empty */ - b = smallbin_at(gm, idx); - p = b->fd; - assert(chunksize(p) == small_index2size(idx)); - unlink_first_small_chunk(gm, b, p, idx); - set_inuse_and_pinuse(gm, p, small_index2size(idx)); - mem = chunk2mem(p); - check_malloced_chunk(gm, mem, nb); - goto postaction; - } - - else if (nb > gm->dvsize) { - if (smallbits != 0) { /* Use chunk in next nonempty smallbin */ - mchunkptr b, p, r; - size_t rsize; - bindex_t i; - binmap_t leftbits = (smallbits << idx) & left_bits(idx2bit(idx)); - binmap_t leastbit = least_bit(leftbits); - compute_bit2idx(leastbit, i); - b = smallbin_at(gm, i); - p = b->fd; - assert(chunksize(p) == small_index2size(i)); - unlink_first_small_chunk(gm, b, p, i); - rsize = small_index2size(i) - nb; - /* Fit here cannot be remainderless if 4byte sizes */ - if (SIZE_T_SIZE != 4 && rsize < MIN_CHUNK_SIZE) - set_inuse_and_pinuse(gm, p, small_index2size(i)); - else { - set_size_and_pinuse_of_inuse_chunk(gm, p, nb); - r = chunk_plus_offset(p, nb); - set_size_and_pinuse_of_free_chunk(r, rsize); - replace_dv(gm, r, rsize); - } - mem = chunk2mem(p); - check_malloced_chunk(gm, mem, nb); - goto postaction; - } - - else if (gm->treemap != 0 && (mem = tmalloc_small(gm, nb)) != 0) { - check_malloced_chunk(gm, mem, nb); - goto postaction; - } - } - } - else if (bytes >= MAX_REQUEST) - nb = MAX_SIZE_T; /* Too big to allocate. Force failure (in sys alloc) */ - else { - nb = pad_request(bytes); - if (gm->treemap != 0 && (mem = tmalloc_large(gm, nb)) != 0) { - check_malloced_chunk(gm, mem, nb); - goto postaction; - } - } - - if (nb <= gm->dvsize) { - size_t rsize = gm->dvsize - nb; - mchunkptr p = gm->dv; - if (rsize >= MIN_CHUNK_SIZE) { /* split dv */ - mchunkptr r = gm->dv = chunk_plus_offset(p, nb); - gm->dvsize = rsize; - set_size_and_pinuse_of_free_chunk(r, rsize); - set_size_and_pinuse_of_inuse_chunk(gm, p, nb); - } - else { /* exhaust dv */ - size_t dvs = gm->dvsize; - gm->dvsize = 0; - gm->dv = 0; - set_inuse_and_pinuse(gm, p, dvs); - } - mem = chunk2mem(p); - check_malloced_chunk(gm, mem, nb); - goto postaction; - } - - else if (nb < gm->topsize) { /* Split top */ - size_t rsize = gm->topsize -= nb; - mchunkptr p = gm->top; - mchunkptr r = gm->top = chunk_plus_offset(p, nb); - r->head = rsize | PINUSE_BIT; - set_size_and_pinuse_of_inuse_chunk(gm, p, nb); - mem = chunk2mem(p); - check_top_chunk(gm, gm->top); - check_malloced_chunk(gm, mem, nb); - goto postaction; - } - - mem = sys_alloc(gm, nb); - - postaction: - POSTACTION(gm); - return mem; - } - - return 0; -} - -/* ---------------------------- free --------------------------- */ - -void dlfree(void* mem) { - /* - Consolidate freed chunks with preceding or succeeding bordering - free chunks, if they exist, and then place in a bin. Intermixed - with special cases for top, dv, mmapped chunks, and usage errors. 
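The smallmap shortcut at the top of dlmalloc rewards a closer look. After shifting the bin bitmap down by the request's bin index, bit 0 of smallbits says the exact bin is non-empty and bit 1 says the next-larger bin is, so one mask tests both; the increment then steps to the neighbor only when the exact bin is empty. A standalone sketch with made-up map contents:

#include <stdio.h>

int main(void) {
  unsigned smallmap = 0x28u; /* bins 3 and 5 non-empty (hypothetical) */
  unsigned idx = 2;          /* the request maps to bin 2 */
  unsigned smallbits = smallmap >> idx;
  if ((smallbits & 0x3u) != 0) {  /* bin 2 or bin 3 can serve it */
    idx += ~smallbits & 1;        /* bin 2 empty, so step to bin 3 */
    printf("serve from bin %u\n", idx);  /* prints: serve from bin 3 */
  }
  return 0;
}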
- */ - - if (mem != 0) { - mchunkptr p = mem2chunk(mem); -#if FOOTERS - mstate fm = get_mstate_for(p); - if (!ok_magic(fm)) { - USAGE_ERROR_ACTION(fm, p); - return; - } -#else /* FOOTERS */ -#define fm gm -#endif /* FOOTERS */ - if (!PREACTION(fm)) { - check_inuse_chunk(fm, p); - if (RTCHECK(ok_address(fm, p) && ok_inuse(p))) { - size_t psize = chunksize(p); - mchunkptr next = chunk_plus_offset(p, psize); - if (!pinuse(p)) { - size_t prevsize = p->prev_foot; - if (is_mmapped(p)) { - psize += prevsize + MMAP_FOOT_PAD; - if (CALL_MUNMAP((char*)p - prevsize, psize) == 0) - fm->footprint -= psize; - goto postaction; - } - else { - mchunkptr prev = chunk_minus_offset(p, prevsize); - psize += prevsize; - p = prev; - if (RTCHECK(ok_address(fm, prev))) { /* consolidate backward */ - if (p != fm->dv) { - unlink_chunk(fm, p, prevsize); - } - else if ((next->head & INUSE_BITS) == INUSE_BITS) { - fm->dvsize = psize; - set_free_with_pinuse(p, psize, next); - goto postaction; - } - } - else - goto erroraction; - } - } - - if (RTCHECK(ok_next(p, next) && ok_pinuse(next))) { - if (!cinuse(next)) { /* consolidate forward */ - if (next == fm->top) { - size_t tsize = fm->topsize += psize; - fm->top = p; - p->head = tsize | PINUSE_BIT; - if (p == fm->dv) { - fm->dv = 0; - fm->dvsize = 0; - } - if (should_trim(fm, tsize)) - sys_trim(fm, 0); - goto postaction; - } - else if (next == fm->dv) { - size_t dsize = fm->dvsize += psize; - fm->dv = p; - set_size_and_pinuse_of_free_chunk(p, dsize); - goto postaction; - } - else { - size_t nsize = chunksize(next); - psize += nsize; - unlink_chunk(fm, next, nsize); - set_size_and_pinuse_of_free_chunk(p, psize); - if (p == fm->dv) { - fm->dvsize = psize; - goto postaction; - } - } - } - else - set_free_with_pinuse(p, psize, next); - - if (is_small(psize)) { - insert_small_chunk(fm, p, psize); - check_free_chunk(fm, p); - } - else { - tchunkptr tp = (tchunkptr)p; - insert_large_chunk(fm, tp, psize); - check_free_chunk(fm, p); - if (--fm->release_checks == 0) - release_unused_segments(fm); - } - goto postaction; - } - } - erroraction: - USAGE_ERROR_ACTION(fm, p); - postaction: - POSTACTION(fm); - } - } -#if !FOOTERS -#undef fm -#endif /* FOOTERS */ -} - -void* dlcalloc(size_t n_elements, size_t elem_size) { - void* mem; - size_t req = 0; - if (n_elements != 0) { - req = n_elements * elem_size; - if (((n_elements | elem_size) & ~(size_t)0xffff) && - (req / n_elements != elem_size)) - req = MAX_SIZE_T; /* force downstream failure on overflow */ - } - mem = dlmalloc(req); - if (mem != 0 && calloc_must_clear(mem2chunk(mem))) - memset(mem, 0, req); - return mem; -} - -#endif /* !ONLY_MSPACES */ - -/* ------------ Internal support for realloc, memalign, etc -------------- */ - -/* Try to realloc; only in-place unless can_move true */ -static mchunkptr try_realloc_chunk(mstate m, mchunkptr p, size_t nb, - int can_move) { - mchunkptr newp = 0; - size_t oldsize = chunksize(p); - mchunkptr next = chunk_plus_offset(p, oldsize); - if (RTCHECK(ok_address(m, p) && ok_inuse(p) && - ok_next(p, next) && ok_pinuse(next))) { - if (is_mmapped(p)) { - newp = mmap_resize(m, p, nb, can_move); - } - else if (oldsize >= nb) { /* already big enough */ - size_t rsize = oldsize - nb; - if (rsize >= MIN_CHUNK_SIZE) { /* split off remainder */ - mchunkptr r = chunk_plus_offset(p, nb); - set_inuse(m, p, nb); - set_inuse(m, r, rsize); - dispose_chunk(m, r, rsize); - } - newp = p; - } - else if (next == m->top) { /* extend into top */ - if (oldsize + m->topsize > nb) { - size_t newsize = oldsize + 
m->topsize; - size_t newtopsize = newsize - nb; - mchunkptr newtop = chunk_plus_offset(p, nb); - set_inuse(m, p, nb); - newtop->head = newtopsize |PINUSE_BIT; - m->top = newtop; - m->topsize = newtopsize; - newp = p; - } - } - else if (next == m->dv) { /* extend into dv */ - size_t dvs = m->dvsize; - if (oldsize + dvs >= nb) { - size_t dsize = oldsize + dvs - nb; - if (dsize >= MIN_CHUNK_SIZE) { - mchunkptr r = chunk_plus_offset(p, nb); - mchunkptr n = chunk_plus_offset(r, dsize); - set_inuse(m, p, nb); - set_size_and_pinuse_of_free_chunk(r, dsize); - clear_pinuse(n); - m->dvsize = dsize; - m->dv = r; - } - else { /* exhaust dv */ - size_t newsize = oldsize + dvs; - set_inuse(m, p, newsize); - m->dvsize = 0; - m->dv = 0; - } - newp = p; - } - } - else if (!cinuse(next)) { /* extend into next free chunk */ - size_t nextsize = chunksize(next); - if (oldsize + nextsize >= nb) { - size_t rsize = oldsize + nextsize - nb; - unlink_chunk(m, next, nextsize); - if (rsize < MIN_CHUNK_SIZE) { - size_t newsize = oldsize + nextsize; - set_inuse(m, p, newsize); - } - else { - mchunkptr r = chunk_plus_offset(p, nb); - set_inuse(m, p, nb); - set_inuse(m, r, rsize); - dispose_chunk(m, r, rsize); - } - newp = p; - } - } - } - else { - USAGE_ERROR_ACTION(m, chunk2mem(p)); - } - return newp; -} - -static void* internal_memalign(mstate m, size_t alignment, size_t bytes) { - void* mem = 0; - if (alignment < MIN_CHUNK_SIZE) /* must be at least a minimum chunk size */ - alignment = MIN_CHUNK_SIZE; - if ((alignment & (alignment-SIZE_T_ONE)) != 0) {/* Ensure a power of 2 */ - size_t a = MALLOC_ALIGNMENT << 1; - while (a < alignment) a <<= 1; - alignment = a; - } - if (bytes >= MAX_REQUEST - alignment) { - if (m != 0) { /* Test isn't needed but avoids compiler warning */ - MALLOC_FAILURE_ACTION; - } - } - else { - size_t nb = request2size(bytes); - size_t req = nb + alignment + MIN_CHUNK_SIZE - CHUNK_OVERHEAD; - mem = internal_malloc(m, req); - if (mem != 0) { - mchunkptr p = mem2chunk(mem); - if (PREACTION(m)) - return 0; - if ((((size_t)(mem)) & (alignment - 1)) != 0) { /* misaligned */ - /* - Find an aligned spot inside chunk. Since we need to give - back leading space in a chunk of at least MIN_CHUNK_SIZE, if - the first calculation places us at a spot with less than - MIN_CHUNK_SIZE leader, we can move to the next aligned spot. - We've allocated enough total room so that this is always - possible. - */ - char* br = (char*)mem2chunk((size_t)(((size_t)((char*)mem + alignment - - SIZE_T_ONE)) & - -alignment)); - char* pos = ((size_t)(br - (char*)(p)) >= MIN_CHUNK_SIZE)? 
- br : br+alignment; - mchunkptr newp = (mchunkptr)pos; - size_t leadsize = pos - (char*)(p); - size_t newsize = chunksize(p) - leadsize; - - if (is_mmapped(p)) { /* For mmapped chunks, just adjust offset */ - newp->prev_foot = p->prev_foot + leadsize; - newp->head = newsize; - } - else { /* Otherwise, give back leader, use the rest */ - set_inuse(m, newp, newsize); - set_inuse(m, p, leadsize); - dispose_chunk(m, p, leadsize); - } - p = newp; - } - - /* Give back spare room at the end */ - if (!is_mmapped(p)) { - size_t size = chunksize(p); - if (size > nb + MIN_CHUNK_SIZE) { - size_t remainder_size = size - nb; - mchunkptr remainder = chunk_plus_offset(p, nb); - set_inuse(m, p, nb); - set_inuse(m, remainder, remainder_size); - dispose_chunk(m, remainder, remainder_size); - } - } - - mem = chunk2mem(p); - assert (chunksize(p) >= nb); - assert(((size_t)mem & (alignment - 1)) == 0); - check_inuse_chunk(m, p); - POSTACTION(m); - } - } - return mem; -} - -/* - Common support for independent_X routines, handling - all of the combinations that can result. - The opts arg has: - bit 0 set if all elements are same size (using sizes[0]) - bit 1 set if elements should be zeroed -*/ -static void** ialloc(mstate m, - size_t n_elements, - size_t* sizes, - int opts, - void* chunks[]) { - - size_t element_size; /* chunksize of each element, if all same */ - size_t contents_size; /* total size of elements */ - size_t array_size; /* request size of pointer array */ - void* mem; /* malloced aggregate space */ - mchunkptr p; /* corresponding chunk */ - size_t remainder_size; /* remaining bytes while splitting */ - void** marray; /* either "chunks" or malloced ptr array */ - mchunkptr array_chunk; /* chunk for malloced ptr array */ - flag_t was_enabled; /* to disable mmap */ - size_t size; - size_t i; - - ensure_initialization(); - /* compute array length, if needed */ - if (chunks != 0) { - if (n_elements == 0) - return chunks; /* nothing to do */ - marray = chunks; - array_size = 0; - } - else { - /* if empty req, must still return chunk representing empty array */ - if (n_elements == 0) - return (void**)internal_malloc(m, 0); - marray = 0; - array_size = request2size(n_elements * (sizeof(void*))); - } - - /* compute total element size */ - if (opts & 0x1) { /* all-same-size */ - element_size = request2size(*sizes); - contents_size = n_elements * element_size; - } - else { /* add up all the sizes */ - element_size = 0; - contents_size = 0; - for (i = 0; i != n_elements; ++i) - contents_size += request2size(sizes[i]); - } - - size = contents_size + array_size; - - /* - Allocate the aggregate chunk. First disable direct-mmapping so - malloc won't use it, since we would not be able to later - free/realloc space internal to a segregated mmap region. 
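The positioning step in internal_memalign above reduces to one rounding expression: overallocate by alignment - 1, then round the payload address up to the next boundary. A minimal sketch under simplified assumptions (power-of-two alignment; the skipped leader is handed back to the caller instead of being re-binned as dlmalloc does):

#include <stdint.h>
#include <stdio.h>
#include <stdlib.h>

static void *toy_memalign(size_t alignment, size_t bytes, void **raw_out) {
  void *raw = malloc(bytes + alignment - 1);
  if (raw == 0)
    return 0;
  uintptr_t mem = ((uintptr_t)raw + (alignment - 1)) &
                  ~(uintptr_t)(alignment - 1);
  *raw_out = raw;            /* caller frees the raw pointer */
  return (void *)mem;
}

int main(void) {
  void *raw;
  void *p = toy_memalign(64, 100, &raw);
  if (p != 0) {
    printf("aligned: %d\n", (uintptr_t)p % 64 == 0);  /* prints: aligned: 1 */
    free(raw);
  }
  return 0;
}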
- */ - was_enabled = use_mmap(m); - disable_mmap(m); - mem = internal_malloc(m, size - CHUNK_OVERHEAD); - if (was_enabled) - enable_mmap(m); - if (mem == 0) - return 0; - - if (PREACTION(m)) return 0; - p = mem2chunk(mem); - remainder_size = chunksize(p); - - assert(!is_mmapped(p)); - - if (opts & 0x2) { /* optionally clear the elements */ - memset((size_t*)mem, 0, remainder_size - SIZE_T_SIZE - array_size); - } - - /* If not provided, allocate the pointer array as final part of chunk */ - if (marray == 0) { - size_t array_chunk_size; - array_chunk = chunk_plus_offset(p, contents_size); - array_chunk_size = remainder_size - contents_size; - marray = (void**) (chunk2mem(array_chunk)); - set_size_and_pinuse_of_inuse_chunk(m, array_chunk, array_chunk_size); - remainder_size = contents_size; - } - - /* split out elements */ - for (i = 0; ; ++i) { - marray[i] = chunk2mem(p); - if (i != n_elements-1) { - if (element_size != 0) - size = element_size; - else - size = request2size(sizes[i]); - remainder_size -= size; - set_size_and_pinuse_of_inuse_chunk(m, p, size); - p = chunk_plus_offset(p, size); - } - else { /* the final element absorbs any overallocation slop */ - set_size_and_pinuse_of_inuse_chunk(m, p, remainder_size); - break; - } - } - -#if DEBUG - if (marray != chunks) { - /* final element must have exactly exhausted chunk */ - if (element_size != 0) { - assert(remainder_size == element_size); - } - else { - assert(remainder_size == request2size(sizes[i])); - } - check_inuse_chunk(m, mem2chunk(marray)); - } - for (i = 0; i != n_elements; ++i) - check_inuse_chunk(m, mem2chunk(marray[i])); - -#endif /* DEBUG */ - - POSTACTION(m); - return marray; -} - -/* Try to free all pointers in the given array. - Note: this could be made faster by delaying consolidation, - at the price of disabling some user integrity checks. We - still optimize some consolidations by combining adjacent - chunks before freeing, which will occur often if allocated - with ialloc or the array is sorted. 
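The adjacent-chunk optimization this comment describes can be shown with a toy layout; the flat buffer and fixed 16-byte block size are hypothetical stand-ins for real chunks and chunksize:

#include <stddef.h>
#include <stdio.h>

int main(void) {
  char heap[64];
  size_t size = 16;  /* uniform toy block size */
  void *array[3] = { heap, heap + 16, heap + 48 };

  for (size_t i = 0; i + 1 < 3; ++i) {
    /* next array slot is the physically adjacent block: combine the two
       and dispose of them once, as internal_bulk_free does below */
    if ((char *)array[i] + size == (char *)array[i + 1])
      printf("coalesce slots %zu and %zu\n", i, i + 1);
  }
  return 0;  /* prints: coalesce slots 0 and 1 */
}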
-*/ -static size_t internal_bulk_free(mstate m, void* array[], size_t nelem) { - size_t unfreed = 0; - if (!PREACTION(m)) { - void** a; - void** fence = &(array[nelem]); - for (a = array; a != fence; ++a) { - void* mem = *a; - if (mem != 0) { - mchunkptr p = mem2chunk(mem); - size_t psize = chunksize(p); -#if FOOTERS - if (get_mstate_for(p) != m) { - ++unfreed; - continue; - } -#endif - check_inuse_chunk(m, p); - *a = 0; - if (RTCHECK(ok_address(m, p) && ok_inuse(p))) { - void ** b = a + 1; /* try to merge with next chunk */ - mchunkptr next = next_chunk(p); - if (b != fence && *b == chunk2mem(next)) { - size_t newsize = chunksize(next) + psize; - set_inuse(m, p, newsize); - *b = chunk2mem(p); - } - else - dispose_chunk(m, p, psize); - } - else { - CORRUPTION_ERROR_ACTION(m); - break; - } - } - } - if (should_trim(m, m->topsize)) - sys_trim(m, 0); - POSTACTION(m); - } - return unfreed; -} - -/* Traversal */ -#if MALLOC_INSPECT_ALL -static void internal_inspect_all(mstate m, - void(*handler)(void *start, - void *end, - size_t used_bytes, - void* callback_arg), - void* arg) { - if (is_initialized(m)) { - mchunkptr top = m->top; - msegmentptr s; - for (s = &m->seg; s != 0; s = s->next) { - mchunkptr q = align_as_chunk(s->base); - while (segment_holds(s, q) && q->head != FENCEPOST_HEAD) { - mchunkptr next = next_chunk(q); - size_t sz = chunksize(q); - size_t used; - void* start; - if (is_inuse(q)) { - used = sz - CHUNK_OVERHEAD; /* must not be mmapped */ - start = chunk2mem(q); - } - else { - used = 0; - if (is_small(sz)) { /* offset by possible bookkeeping */ - start = (void*)((char*)q + sizeof(struct malloc_chunk)); - } - else { - start = (void*)((char*)q + sizeof(struct malloc_tree_chunk)); - } - } - if (start < (void*)next) /* skip if all space is bookkeeping */ - handler(start, next, used, arg); - if (q == top) - break; - q = next; - } - } - } -} -#endif /* MALLOC_INSPECT_ALL */ - -/* ------------------ Exported realloc, memalign, etc -------------------- */ - -#if !ONLY_MSPACES - -void* dlrealloc(void* oldmem, size_t bytes) { - void* mem = 0; - if (oldmem == 0) { - mem = dlmalloc(bytes); - } - else if (bytes >= MAX_REQUEST) { - MALLOC_FAILURE_ACTION; - } -#ifdef REALLOC_ZERO_BYTES_FREES - else if (bytes == 0) { - dlfree(oldmem); - } -#endif /* REALLOC_ZERO_BYTES_FREES */ - else { - size_t nb = request2size(bytes); - mchunkptr oldp = mem2chunk(oldmem); -#if ! FOOTERS - mstate m = gm; -#else /* FOOTERS */ - mstate m = get_mstate_for(oldp); - if (!ok_magic(m)) { - USAGE_ERROR_ACTION(m, oldmem); - return 0; - } -#endif /* FOOTERS */ - if (!PREACTION(m)) { - mchunkptr newp = try_realloc_chunk(m, oldp, nb, 1); - POSTACTION(m); - if (newp != 0) { - check_inuse_chunk(m, newp); - mem = chunk2mem(newp); - } - else { - mem = internal_malloc(m, bytes); - if (mem != 0) { - size_t oc = chunksize(oldp) - overhead_for(oldp); - memcpy(mem, oldmem, (oc < bytes)? oc : bytes); - internal_free(m, oldmem); - } - } - } - } - return mem; -} - -void* dlrealloc_in_place(void* oldmem, size_t bytes) { - void* mem = 0; - if (oldmem != 0) { - if (bytes >= MAX_REQUEST) { - MALLOC_FAILURE_ACTION; - } - else { - size_t nb = request2size(bytes); - mchunkptr oldp = mem2chunk(oldmem); -#if ! 
FOOTERS - mstate m = gm; -#else /* FOOTERS */ - mstate m = get_mstate_for(oldp); - if (!ok_magic(m)) { - USAGE_ERROR_ACTION(m, oldmem); - return 0; - } -#endif /* FOOTERS */ - if (!PREACTION(m)) { - mchunkptr newp = try_realloc_chunk(m, oldp, nb, 0); - POSTACTION(m); - if (newp == oldp) { - check_inuse_chunk(m, newp); - mem = oldmem; - } - } - } - } - return mem; -} - -void* dlmemalign(size_t alignment, size_t bytes) { - if (alignment <= MALLOC_ALIGNMENT) { - return dlmalloc(bytes); - } - return internal_memalign(gm, alignment, bytes); -} - -int dlposix_memalign(void** pp, size_t alignment, size_t bytes) { - void* mem = 0; - if (alignment == MALLOC_ALIGNMENT) - mem = dlmalloc(bytes); - else { - size_t d = alignment / sizeof(void*); - size_t r = alignment % sizeof(void*); - if (r != 0 || d == 0 || (d & (d-SIZE_T_ONE)) != 0) - return EINVAL; - else if (bytes <= MAX_REQUEST - alignment) { - if (alignment < MIN_CHUNK_SIZE) - alignment = MIN_CHUNK_SIZE; - mem = internal_memalign(gm, alignment, bytes); - } - } - if (mem == 0) - return ENOMEM; - else { - *pp = mem; - return 0; - } -} - -void* dlvalloc(size_t bytes) { - size_t pagesz; - ensure_initialization(); - pagesz = mparams.page_size; - return dlmemalign(pagesz, bytes); -} - -void* dlpvalloc(size_t bytes) { - size_t pagesz; - ensure_initialization(); - pagesz = mparams.page_size; - return dlmemalign(pagesz, (bytes + pagesz - SIZE_T_ONE) & ~(pagesz - SIZE_T_ONE)); -} - -void** dlindependent_calloc(size_t n_elements, size_t elem_size, - void* chunks[]) { - size_t sz = elem_size; /* serves as 1-element array */ - return ialloc(gm, n_elements, &sz, 3, chunks); -} - -void** dlindependent_comalloc(size_t n_elements, size_t sizes[], - void* chunks[]) { - return ialloc(gm, n_elements, sizes, 0, chunks); -} - -size_t dlbulk_free(void* array[], size_t nelem) { - return internal_bulk_free(gm, array, nelem); -} - -#if MALLOC_INSPECT_ALL -void dlmalloc_inspect_all(void(*handler)(void *start, - void *end, - size_t used_bytes, - void* callback_arg), - void* arg) { - ensure_initialization(); - if (!PREACTION(gm)) { - internal_inspect_all(gm, handler, arg); - POSTACTION(gm); - } -} -#endif /* MALLOC_INSPECT_ALL */ - -int dlmalloc_trim(size_t pad) { - int result = 0; - ensure_initialization(); - if (!PREACTION(gm)) { - result = sys_trim(gm, pad); - POSTACTION(gm); - } - return result; -} - -size_t dlmalloc_footprint(void) { - return gm->footprint; -} - -size_t dlmalloc_max_footprint(void) { - return gm->max_footprint; -} - -size_t dlmalloc_footprint_limit(void) { - size_t maf = gm->footprint_limit; - return maf == 0 ? 
MAX_SIZE_T : maf; -} - -size_t dlmalloc_set_footprint_limit(size_t bytes) { - size_t result; /* invert sense of 0 */ - if (bytes == 0) - result = granularity_align(1); /* Use minimal size */ - else if (bytes == MAX_SIZE_T) - result = 0; /* disable */ - else - result = granularity_align(bytes); - return gm->footprint_limit = result; -} - -#if !NO_MALLINFO -struct mallinfo dlmallinfo(void) { - return internal_mallinfo(gm); -} -#endif /* NO_MALLINFO */ - -#if !NO_MALLOC_STATS -void dlmalloc_stats() { - internal_malloc_stats(gm); -} -#endif /* NO_MALLOC_STATS */ - -int dlmallopt(int param_number, int value) { - return change_mparam(param_number, value); -} - -size_t dlmalloc_usable_size(void* mem) { - if (mem != 0) { - mchunkptr p = mem2chunk(mem); - if (is_inuse(p)) - return chunksize(p) - overhead_for(p); - } - return 0; -} - -#endif /* !ONLY_MSPACES */ - -/* ----------------------------- user mspaces ---------------------------- */ - -#if MSPACES - -static mstate init_user_mstate(char* tbase, size_t tsize) { - size_t msize = pad_request(sizeof(struct malloc_state)); - mchunkptr mn; - mchunkptr msp = align_as_chunk(tbase); - mstate m = (mstate)(chunk2mem(msp)); - memset(m, 0, msize); - (void)INITIAL_LOCK(&m->mutex); - msp->head = (msize|INUSE_BITS); - m->seg.base = m->least_addr = tbase; - m->seg.size = m->footprint = m->max_footprint = tsize; - m->magic = mparams.magic; - m->release_checks = MAX_RELEASE_CHECK_RATE; - m->mflags = mparams.default_mflags; - m->extp = 0; - m->exts = 0; - disable_contiguous(m); - init_bins(m); - mn = next_chunk(mem2chunk(m)); - init_top(m, mn, (size_t)((tbase + tsize) - (char*)mn) - TOP_FOOT_SIZE); - check_top_chunk(m, m->top); - return m; -} - -static mstate init_device_mstate(char* tbase, char* dbase, size_t tsize) { - size_t msize = pad_request(sizeof(struct malloc_state)); - mchunkptr mn; - mchunkptr msp = align_as_chunk(tbase); - mstate m = (mstate)(chunk2mem(msp)); - //memset(m, 0, msize); - (void)INITIAL_LOCK(&m->mutex); - msp->head = (msize|INUSE_BITS); - m->seg.base = m->least_addr = dbase; - m->seg.size = m->footprint = m->max_footprint = tsize; - m->magic = mparams.magic; - m->release_checks = MAX_RELEASE_CHECK_RATE; - m->mflags = mparams.default_mflags; - m->extp = 0; - m->exts = 0; - disable_contiguous(m); - init_bins(m); - mn = next_chunk(mem2chunk(m)); - init_top(m, mn, (size_t)((tbase + tsize) - (char*)mn) - TOP_FOOT_SIZE); - //check_top_chunk(m, m->top); - return m; -} - - -mspace create_mspace(size_t capacity, int locked) { - mstate m = 0; - size_t msize; - ensure_initialization(); - msize = pad_request(sizeof(struct malloc_state)); - if (capacity < (size_t) -(msize + TOP_FOOT_SIZE + mparams.page_size)) { - size_t rs = ((capacity == 0)? 
mparams.granularity : - (capacity + TOP_FOOT_SIZE + msize)); - size_t tsize = granularity_align(rs); - char* tbase = (char*)(CALL_MMAP(tsize)); - if (tbase != CMFAIL) { - m = init_user_mstate(tbase, tsize); - m->seg.sflags = USE_MMAP_BIT; - set_lock(m, locked); - } - } - return (mspace)m; -} - -mspace create_mspace_with_base(void* base, size_t capacity, int locked) { - mstate m = 0; - size_t msize; - ensure_initialization(); - msize = pad_request(sizeof(struct malloc_state)); - if (capacity > msize + TOP_FOOT_SIZE && - capacity < (size_t) -(msize + TOP_FOOT_SIZE + mparams.page_size)) { - m = init_user_mstate((char*)base, capacity); - m->seg.sflags = EXTERN_BIT; - set_lock(m, locked); - } - return (mspace)m; -} - -mspace create_device_mspace_with_base(void* base, size_t capacity, int locked) { - mstate m = 0; - size_t msize; - //ensure_initialization(); - msize = pad_request(sizeof(struct malloc_state)); - void* host_base; - host_base = malloc(msize + TOP_FOOT_SIZE + mparams.page_size); - if (capacity > msize + TOP_FOOT_SIZE && - capacity < (size_t) -(msize + TOP_FOOT_SIZE + mparams.page_size)) { - m = init_device_mstate((char*)host_base, (char*)base, capacity); - m->seg.sflags = EXTERN_BIT; - set_lock(m, locked); - } - return (mspace)m; -} - - -int mspace_track_large_chunks(mspace msp, int enable) { - int ret = 0; - mstate ms = (mstate)msp; - if (!PREACTION(ms)) { - if (!use_mmap(ms)) { - ret = 1; - } - if (!enable) { - enable_mmap(ms); - } else { - disable_mmap(ms); - } - POSTACTION(ms); - } - return ret; -} - -size_t destroy_mspace(mspace msp) { - size_t freed = 0; - mstate ms = (mstate)msp; - if (ok_magic(ms)) { - msegmentptr sp = &ms->seg; - (void)DESTROY_LOCK(&ms->mutex); /* destroy before unmapped */ - while (sp != 0) { - char* base = sp->base; - size_t size = sp->size; - flag_t flag = sp->sflags; - (void)base; /* placate people compiling -Wunused-variable */ - sp = sp->next; - if ((flag & USE_MMAP_BIT) && !(flag & EXTERN_BIT) && - CALL_MUNMAP(base, size) == 0) - freed += size; - } - } - else { - USAGE_ERROR_ACTION(ms,ms); - } - return freed; -} - -/* - mspace versions of routines are near-clones of the global - versions. This is not so nice but better than the alternatives. -*/ - -void* mspace_malloc(mspace msp, size_t bytes) { - mstate ms = (mstate)msp; - if (!ok_magic(ms)) { - USAGE_ERROR_ACTION(ms,ms); - return 0; - } - if (!PREACTION(ms)) { - void* mem; - size_t nb; - if (bytes <= MAX_SMALL_REQUEST) { - bindex_t idx; - binmap_t smallbits; - nb = (bytes < MIN_REQUEST)? MIN_CHUNK_SIZE : pad_request(bytes); - idx = small_index(nb); - smallbits = ms->smallmap >> idx; - - if ((smallbits & 0x3U) != 0) { /* Remainderless fit to a smallbin. 
*/ - mchunkptr b, p; - idx += ~smallbits & 1; /* Uses next bin if idx empty */ - b = smallbin_at(ms, idx); - p = b->fd; - assert(chunksize(p) == small_index2size(idx)); - unlink_first_small_chunk(ms, b, p, idx); - set_inuse_and_pinuse(ms, p, small_index2size(idx)); - mem = chunk2mem(p); - check_malloced_chunk(ms, mem, nb); - goto postaction; - } - - else if (nb > ms->dvsize) { - if (smallbits != 0) { /* Use chunk in next nonempty smallbin */ - mchunkptr b, p, r; - size_t rsize; - bindex_t i; - binmap_t leftbits = (smallbits << idx) & left_bits(idx2bit(idx)); - binmap_t leastbit = least_bit(leftbits); - compute_bit2idx(leastbit, i); - b = smallbin_at(ms, i); - p = b->fd; - assert(chunksize(p) == small_index2size(i)); - unlink_first_small_chunk(ms, b, p, i); - rsize = small_index2size(i) - nb; - /* Fit here cannot be remainderless if 4byte sizes */ - if (SIZE_T_SIZE != 4 && rsize < MIN_CHUNK_SIZE) - set_inuse_and_pinuse(ms, p, small_index2size(i)); - else { - set_size_and_pinuse_of_inuse_chunk(ms, p, nb); - r = chunk_plus_offset(p, nb); - set_size_and_pinuse_of_free_chunk(r, rsize); - replace_dv(ms, r, rsize); - } - mem = chunk2mem(p); - check_malloced_chunk(ms, mem, nb); - goto postaction; - } - - else if (ms->treemap != 0 && (mem = tmalloc_small(ms, nb)) != 0) { - check_malloced_chunk(ms, mem, nb); - goto postaction; - } - } - } - else if (bytes >= MAX_REQUEST) - nb = MAX_SIZE_T; /* Too big to allocate. Force failure (in sys alloc) */ - else { - nb = pad_request(bytes); - if (ms->treemap != 0 && (mem = tmalloc_large(ms, nb)) != 0) { - check_malloced_chunk(ms, mem, nb); - goto postaction; - } - } - - if (nb <= ms->dvsize) { - size_t rsize = ms->dvsize - nb; - mchunkptr p = ms->dv; - if (rsize >= MIN_CHUNK_SIZE) { /* split dv */ - mchunkptr r = ms->dv = chunk_plus_offset(p, nb); - ms->dvsize = rsize; - set_size_and_pinuse_of_free_chunk(r, rsize); - set_size_and_pinuse_of_inuse_chunk(ms, p, nb); - } - else { /* exhaust dv */ - size_t dvs = ms->dvsize; - ms->dvsize = 0; - ms->dv = 0; - set_inuse_and_pinuse(ms, p, dvs); - } - mem = chunk2mem(p); - check_malloced_chunk(ms, mem, nb); - goto postaction; - } - - else if (nb < ms->topsize) { /* Split top */ - size_t rsize = ms->topsize -= nb; - mchunkptr p = ms->top; - mchunkptr r = ms->top = chunk_plus_offset(p, nb); - r->head = rsize | PINUSE_BIT; - set_size_and_pinuse_of_inuse_chunk(ms, p, nb); - mem = chunk2mem(p); - check_top_chunk(ms, ms->top); - check_malloced_chunk(ms, mem, nb); - goto postaction; - } - - mem = sys_alloc(ms, nb); - - postaction: - POSTACTION(ms); - return mem; - } - - return 0; -} - -void mspace_free(mspace msp, void* mem) { - if (mem != 0) { - mchunkptr p = mem2chunk(mem); -#if FOOTERS - mstate fm = get_mstate_for(p); - (void)msp; /* placate people compiling -Wunused */ -#else /* FOOTERS */ - mstate fm = (mstate)msp; -#endif /* FOOTERS */ - if (!ok_magic(fm)) { - USAGE_ERROR_ACTION(fm, p); - return; - } - if (!PREACTION(fm)) { - check_inuse_chunk(fm, p); - if (RTCHECK(ok_address(fm, p) && ok_inuse(p))) { - size_t psize = chunksize(p); - mchunkptr next = chunk_plus_offset(p, psize); - if (!pinuse(p)) { - size_t prevsize = p->prev_foot; - if (is_mmapped(p)) { - psize += prevsize + MMAP_FOOT_PAD; - if (CALL_MUNMAP((char*)p - prevsize, psize) == 0) - fm->footprint -= psize; - goto postaction; - } - else { - mchunkptr prev = chunk_minus_offset(p, prevsize); - psize += prevsize; - p = prev; - if (RTCHECK(ok_address(fm, prev))) { /* consolidate backward */ - if (p != fm->dv) { - unlink_chunk(fm, p, prevsize); - } - else if 
((next->head & INUSE_BITS) == INUSE_BITS) { - fm->dvsize = psize; - set_free_with_pinuse(p, psize, next); - goto postaction; - } - } - else - goto erroraction; - } - } - - if (RTCHECK(ok_next(p, next) && ok_pinuse(next))) { - if (!cinuse(next)) { /* consolidate forward */ - if (next == fm->top) { - size_t tsize = fm->topsize += psize; - fm->top = p; - p->head = tsize | PINUSE_BIT; - if (p == fm->dv) { - fm->dv = 0; - fm->dvsize = 0; - } - if (should_trim(fm, tsize)) - sys_trim(fm, 0); - goto postaction; - } - else if (next == fm->dv) { - size_t dsize = fm->dvsize += psize; - fm->dv = p; - set_size_and_pinuse_of_free_chunk(p, dsize); - goto postaction; - } - else { - size_t nsize = chunksize(next); - psize += nsize; - unlink_chunk(fm, next, nsize); - set_size_and_pinuse_of_free_chunk(p, psize); - if (p == fm->dv) { - fm->dvsize = psize; - goto postaction; - } - } - } - else - set_free_with_pinuse(p, psize, next); - - if (is_small(psize)) { - insert_small_chunk(fm, p, psize); - check_free_chunk(fm, p); - } - else { - tchunkptr tp = (tchunkptr)p; - insert_large_chunk(fm, tp, psize); - check_free_chunk(fm, p); - if (--fm->release_checks == 0) - release_unused_segments(fm); - } - goto postaction; - } - } - erroraction: - USAGE_ERROR_ACTION(fm, p); - postaction: - POSTACTION(fm); - } - } -} - -void* mspace_calloc(mspace msp, size_t n_elements, size_t elem_size) { - void* mem; - size_t req = 0; - mstate ms = (mstate)msp; - if (!ok_magic(ms)) { - USAGE_ERROR_ACTION(ms,ms); - return 0; - } - if (n_elements != 0) { - req = n_elements * elem_size; - if (((n_elements | elem_size) & ~(size_t)0xffff) && - (req / n_elements != elem_size)) - req = MAX_SIZE_T; /* force downstream failure on overflow */ - } - mem = internal_malloc(ms, req); - if (mem != 0 && calloc_must_clear(mem2chunk(mem))) - memset(mem, 0, req); - return mem; -} - -void* mspace_realloc(mspace msp, void* oldmem, size_t bytes) { - void* mem = 0; - if (oldmem == 0) { - mem = mspace_malloc(msp, bytes); - } - else if (bytes >= MAX_REQUEST) { - MALLOC_FAILURE_ACTION; - } -#ifdef REALLOC_ZERO_BYTES_FREES - else if (bytes == 0) { - mspace_free(msp, oldmem); - } -#endif /* REALLOC_ZERO_BYTES_FREES */ - else { - size_t nb = request2size(bytes); - mchunkptr oldp = mem2chunk(oldmem); -#if ! FOOTERS - mstate m = (mstate)msp; -#else /* FOOTERS */ - mstate m = get_mstate_for(oldp); - if (!ok_magic(m)) { - USAGE_ERROR_ACTION(m, oldmem); - return 0; - } -#endif /* FOOTERS */ - if (!PREACTION(m)) { - mchunkptr newp = try_realloc_chunk(m, oldp, nb, 1); - POSTACTION(m); - if (newp != 0) { - check_inuse_chunk(m, newp); - mem = chunk2mem(newp); - } - else { - mem = mspace_malloc(m, bytes); - if (mem != 0) { - size_t oc = chunksize(oldp) - overhead_for(oldp); - memcpy(mem, oldmem, (oc < bytes)? oc : bytes); - mspace_free(m, oldmem); - } - } - } - } - return mem; -} - -void* mspace_realloc_in_place(mspace msp, void* oldmem, size_t bytes) { - void* mem = 0; - if (oldmem != 0) { - if (bytes >= MAX_REQUEST) { - MALLOC_FAILURE_ACTION; - } - else { - size_t nb = request2size(bytes); - mchunkptr oldp = mem2chunk(oldmem); -#if ! 
FOOTERS - mstate m = (mstate)msp; -#else /* FOOTERS */ - mstate m = get_mstate_for(oldp); - (void)msp; /* placate people compiling -Wunused */ - if (!ok_magic(m)) { - USAGE_ERROR_ACTION(m, oldmem); - return 0; - } -#endif /* FOOTERS */ - if (!PREACTION(m)) { - mchunkptr newp = try_realloc_chunk(m, oldp, nb, 0); - POSTACTION(m); - if (newp == oldp) { - check_inuse_chunk(m, newp); - mem = oldmem; - } - } - } - } - return mem; -} - -void* mspace_memalign(mspace msp, size_t alignment, size_t bytes) { - mstate ms = (mstate)msp; - if (!ok_magic(ms)) { - USAGE_ERROR_ACTION(ms,ms); - return 0; - } - if (alignment <= MALLOC_ALIGNMENT) - return mspace_malloc(msp, bytes); - return internal_memalign(ms, alignment, bytes); -} - -void** mspace_independent_calloc(mspace msp, size_t n_elements, - size_t elem_size, void* chunks[]) { - size_t sz = elem_size; /* serves as 1-element array */ - mstate ms = (mstate)msp; - if (!ok_magic(ms)) { - USAGE_ERROR_ACTION(ms,ms); - return 0; - } - return ialloc(ms, n_elements, &sz, 3, chunks); -} - -void** mspace_independent_comalloc(mspace msp, size_t n_elements, - size_t sizes[], void* chunks[]) { - mstate ms = (mstate)msp; - if (!ok_magic(ms)) { - USAGE_ERROR_ACTION(ms,ms); - return 0; - } - return ialloc(ms, n_elements, sizes, 0, chunks); -} - -size_t mspace_bulk_free(mspace msp, void* array[], size_t nelem) { - return internal_bulk_free((mstate)msp, array, nelem); -} - -#if MALLOC_INSPECT_ALL -void mspace_inspect_all(mspace msp, - void(*handler)(void *start, - void *end, - size_t used_bytes, - void* callback_arg), - void* arg) { - mstate ms = (mstate)msp; - if (ok_magic(ms)) { - if (!PREACTION(ms)) { - internal_inspect_all(ms, handler, arg); - POSTACTION(ms); - } - } - else { - USAGE_ERROR_ACTION(ms,ms); - } -} -#endif /* MALLOC_INSPECT_ALL */ - -int mspace_trim(mspace msp, size_t pad) { - int result = 0; - mstate ms = (mstate)msp; - if (ok_magic(ms)) { - if (!PREACTION(ms)) { - result = sys_trim(ms, pad); - POSTACTION(ms); - } - } - else { - USAGE_ERROR_ACTION(ms,ms); - } - return result; -} - -#if !NO_MALLOC_STATS -void mspace_malloc_stats(mspace msp) { - mstate ms = (mstate)msp; - if (ok_magic(ms)) { - internal_malloc_stats(ms); - } - else { - USAGE_ERROR_ACTION(ms,ms); - } -} -#endif /* NO_MALLOC_STATS */ - -size_t mspace_footprint(mspace msp) { - size_t result = 0; - mstate ms = (mstate)msp; - if (ok_magic(ms)) { - result = ms->footprint; - } - else { - USAGE_ERROR_ACTION(ms,ms); - } - return result; -} - -size_t mspace_max_footprint(mspace msp) { - size_t result = 0; - mstate ms = (mstate)msp; - if (ok_magic(ms)) { - result = ms->max_footprint; - } - else { - USAGE_ERROR_ACTION(ms,ms); - } - return result; -} - -size_t mspace_footprint_limit(mspace msp) { - size_t result = 0; - mstate ms = (mstate)msp; - if (ok_magic(ms)) { - size_t maf = ms->footprint_limit; - result = (maf == 0) ? 
MAX_SIZE_T : maf; - } - else { - USAGE_ERROR_ACTION(ms,ms); - } - return result; -} - -size_t mspace_set_footprint_limit(mspace msp, size_t bytes) { - size_t result = 0; - mstate ms = (mstate)msp; - if (ok_magic(ms)) { - if (bytes == 0) - result = granularity_align(1); /* Use minimal size */ - else if (bytes == MAX_SIZE_T) - result = 0; /* disable */ - else - result = granularity_align(bytes); - ms->footprint_limit = result; - } - else { - USAGE_ERROR_ACTION(ms,ms); - } - return result; -} - -#if !NO_MALLINFO -struct mallinfo mspace_mallinfo(mspace msp) { - mstate ms = (mstate)msp; - if (!ok_magic(ms)) { - USAGE_ERROR_ACTION(ms,ms); - } - return internal_mallinfo(ms); -} -#endif /* NO_MALLINFO */ - -size_t mspace_usable_size(const void* mem) { - if (mem != 0) { - mchunkptr p = mem2chunk(mem); - if (is_inuse(p)) - return chunksize(p) - overhead_for(p); - } - return 0; -} - -int mspace_mallopt(int param_number, int value) { - return change_mparam(param_number, value); -} - -#endif /* MSPACES */ - - -/* -------------------- Alternative MORECORE functions ------------------- */ - -/* - Guidelines for creating a custom version of MORECORE: - - * For best performance, MORECORE should allocate in multiples of pagesize. - * MORECORE may allocate more memory than requested. (Or even less, - but this will usually result in a malloc failure.) - * MORECORE must not allocate memory when given argument zero, but - instead return one past the end address of memory from previous - nonzero call. - * For best performance, consecutive calls to MORECORE with positive - arguments should return increasing addresses, indicating that - space has been contiguously extended. - * Even though consecutive calls to MORECORE need not return contiguous - addresses, it must be OK for malloc'ed chunks to span multiple - regions in those cases where they do happen to be contiguous. - * MORECORE need not handle negative arguments -- it may instead - just return MFAIL when given negative arguments. - Negative arguments are always multiples of pagesize. MORECORE - must not misinterpret negative args as large positive unsigned - args. You can suppress all such calls from even occurring by defining - MORECORE_CANNOT_TRIM. - - As an example alternative MORECORE, here is a custom allocator - kindly contributed for pre-OSX macOS. It uses virtually but not - necessarily physically contiguous non-paged memory (locked in, - present and won't get swapped out). You can use it by uncommenting - this section, adding some #includes, and setting up the appropriate - defines above: - - #define MORECORE osMoreCore - - There is also a shutdown routine that should somehow be called for - cleanup upon program exit. 
- - #define MAX_POOL_ENTRIES 100 - #define MINIMUM_MORECORE_SIZE (64 * 1024U) - static int next_os_pool; - void *our_os_pools[MAX_POOL_ENTRIES]; - - void *osMoreCore(int size) - { - void *ptr = 0; - static void *sbrk_top = 0; - - if (size > 0) - { - if (size < MINIMUM_MORECORE_SIZE) - size = MINIMUM_MORECORE_SIZE; - if (CurrentExecutionLevel() == kTaskLevel) - ptr = PoolAllocateResident(size + RM_PAGE_SIZE, 0); - if (ptr == 0) - { - return (void *) MFAIL; - } - // save ptrs so they can be freed during cleanup - our_os_pools[next_os_pool] = ptr; - next_os_pool++; - ptr = (void *) ((((size_t) ptr) + RM_PAGE_MASK) & ~RM_PAGE_MASK); - sbrk_top = (char *) ptr + size; - return ptr; - } - else if (size < 0) - { - // we don't currently support shrink behavior - return (void *) MFAIL; - } - else - { - return sbrk_top; - } - } - - // cleanup any allocated memory pools - // called as last thing before shutting down driver - - void osCleanupMem(void) - { - void **ptr; - - for (ptr = our_os_pools; ptr < &our_os_pools[MAX_POOL_ENTRIES]; ptr++) - if (*ptr) - { - PoolDeallocate(*ptr); - *ptr = 0; - } - } - -*/ - - -/* ----------------------------------------------------------------------- -History: - v2.8.6 Wed Aug 29 06:57:58 2012 Doug Lea - * fix bad comparison in dlposix_memalign - * don't reuse adjusted asize in sys_alloc - * add LOCK_AT_FORK -- thanks to Kirill Artamonov for the suggestion - * reduce compiler warnings -- thanks to all who reported/suggested these - - v2.8.5 Sun May 22 10:26:02 2011 Doug Lea (dl at gee) - * Always perform unlink checks unless INSECURE - * Add posix_memalign. - * Improve realloc to expand in more cases; expose realloc_in_place. - Thanks to Peter Buhr for the suggestion. - * Add footprint_limit, inspect_all, bulk_free. Thanks - to Barry Hayes and others for the suggestions. - * Internal refactorings to avoid calls while holding locks - * Use non-reentrant locks by default. Thanks to Roland McGrath - for the suggestion. - * Small fixes to mspace_destroy, reset_on_error. - * Various configuration extensions/changes. Thanks - to all who contributed these. - - V2.8.4a Thu Apr 28 14:39:43 2011 (dl at gee.cs.oswego.edu) - * Update Creative Commons URL - - V2.8.4 Wed May 27 09:56:23 2009 Doug Lea (dl at gee) - * Use zeros instead of prev foot for is_mmapped - * Add mspace_track_large_chunks; thanks to Jean Brouwers - * Fix set_inuse in internal_realloc; thanks to Jean Brouwers - * Fix insufficient sys_alloc padding when using 16byte alignment - * Fix bad error check in mspace_footprint - * Adaptations for ptmalloc; thanks to Wolfram Gloger. - * Reentrant spin locks; thanks to Earl Chew and others - * Win32 improvements; thanks to Niall Douglas and Earl Chew - * Add NO_SEGMENT_TRAVERSAL and MAX_RELEASE_CHECK_RATE options - * Extension hook in malloc_state - * Various small adjustments to reduce warnings on some compilers - * Various configuration extensions/changes for more platforms. Thanks - to all who contributed these. - - V2.8.3 Thu Sep 22 11:16:32 2005 Doug Lea (dl at gee) - * Add max_footprint functions - * Ensure all appropriate literals are size_t - * Fix conditional compilation problem for some #define settings - * Avoid concatenating segments with the one provided - in create_mspace_with_base - * Rename some variables to avoid compiler shadowing warnings - * Use explicit lock initialization. - * Better handling of sbrk interference. 
- * Simplify and fix segment insertion, trimming and mspace_destroy - * Reinstate REALLOC_ZERO_BYTES_FREES option from 2.7.x - * Thanks especially to Dennis Flanagan for help on these. - - V2.8.2 Sun Jun 12 16:01:10 2005 Doug Lea (dl at gee) - * Fix memalign brace error. - - V2.8.1 Wed Jun 8 16:11:46 2005 Doug Lea (dl at gee) - * Fix improper #endif nesting in C++ - * Add explicit casts needed for C++ - - V2.8.0 Mon May 30 14:09:02 2005 Doug Lea (dl at gee) - * Use trees for large bins - * Support mspaces - * Use segments to unify sbrk-based and mmap-based system allocation, - removing need for emulation on most platforms without sbrk. - * Default safety checks - * Optional footer checks. Thanks to William Robertson for the idea. - * Internal code refactoring - * Incorporate suggestions and platform-specific changes. - Thanks to Dennis Flanagan, Colin Plumb, Niall Douglas, - Aaron Bachmann, Emery Berger, and others. - * Speed up non-fastbin processing enough to remove fastbins. - * Remove useless cfree() to avoid conflicts with other apps. - * Remove internal memcpy, memset. Compilers handle builtins better. - * Remove some options that no one ever used and rename others. - - V2.7.2 Sat Aug 17 09:07:30 2002 Doug Lea (dl at gee) - * Fix malloc_state bitmap array misdeclaration - - V2.7.1 Thu Jul 25 10:58:03 2002 Doug Lea (dl at gee) - * Allow tuning of FIRST_SORTED_BIN_SIZE - * Use PTR_UINT as type for all ptr->int casts. Thanks to John Belmonte. - * Better detection and support for non-contiguousness of MORECORE. - Thanks to Andreas Mueller, Conal Walsh, and Wolfram Gloger - * Bypass most of malloc if no frees. Thanks to Emery Berger. - * Fix freeing of old top non-contiguous chunk in sysmalloc. - * Raised default trim and map thresholds to 256K. - * Fix mmap-related #defines. Thanks to Lubos Lunak. - * Fix copy macros; added LACKS_FCNTL_H. Thanks to Neal Walfield. - * Branch-free bin calculation - * Default trim and mmap thresholds now 256K. - - V2.7.0 Sun Mar 11 14:14:06 2001 Doug Lea (dl at gee) - * Introduce independent_comalloc and independent_calloc. - Thanks to Michael Pachos for motivation and help. - * Make optional .h file available - * Allow > 2GB requests on 32bit systems. - * new WIN32 sbrk, mmap, munmap, lock code from . - Thanks also to Andreas Mueller , - and Anonymous. - * Allow override of MALLOC_ALIGNMENT (Thanks to Ruud Waij for - helping test this.) - * memalign: check alignment arg - * realloc: don't try to shift chunks backwards, since this - leads to more fragmentation in some programs and doesn't - seem to help in any others. - * Collect all cases in malloc requiring system memory into sysmalloc - * Use mmap as backup to sbrk - * Place all internal state in malloc_state - * Introduce fastbins (although similar to 2.5.1) - * Many minor tunings and cosmetic improvements - * Introduce USE_PUBLIC_MALLOC_WRAPPERS, USE_MALLOC_LOCK - * Introduce MALLOC_FAILURE_ACTION, MORECORE_CONTIGUOUS - Thanks to Tony E. Bennett and others. - * Include errno.h to support default failure action. - - V2.6.6 Sun Dec 5 07:42:19 1999 Doug Lea (dl at gee) - * return null for negative arguments - * Added several WIN32 cleanups from Martin C. Fong - * Add 'LACKS_SYS_PARAM_H' for those systems without 'sys/param.h' - (e.g. 
WIN32 platforms) - * Cleanup header file inclusion for WIN32 platforms - * Cleanup code to avoid Microsoft Visual C++ compiler complaints - * Add 'USE_DL_PREFIX' to quickly allow co-existence with existing - memory allocation routines - * Set 'malloc_getpagesize' for WIN32 platforms (needs more work) - * Use 'assert' rather than 'ASSERT' in WIN32 code to conform to - usage of 'assert' in non-WIN32 code - * Improve WIN32 'sbrk()' emulation's 'findRegion()' routine to - avoid infinite loop - * Always call 'fREe()' rather than 'free()' - - V2.6.5 Wed Jun 17 15:57:31 1998 Doug Lea (dl at gee) - * Fixed ordering problem with boundary-stamping - - V2.6.3 Sun May 19 08:17:58 1996 Doug Lea (dl at gee) - * Added pvalloc, as recommended by H.J. Liu - * Added 64bit pointer support mainly from Wolfram Gloger - * Added anonymously donated WIN32 sbrk emulation - * Malloc, calloc, getpagesize: add optimizations from Raymond Nijssen - * malloc_extend_top: fix mask error that caused wastage after - foreign sbrks - * Add linux mremap support code from HJ Liu - - V2.6.2 Tue Dec 5 06:52:55 1995 Doug Lea (dl at gee) - * Integrated most documentation with the code. - * Add support for mmap, with help from - Wolfram Gloger (Gloger@lrz.uni-muenchen.de). - * Use last_remainder in more cases. - * Pack bins using idea from colin@nyx10.cs.du.edu - * Use ordered bins instead of best-fit threshold - * Eliminate block-local decls to simplify tracing and debugging. - * Support another case of realloc via move into top - * Fix error occurring when initial sbrk_base not word-aligned. - * Rely on page size for units instead of SBRK_UNIT to - avoid surprises about sbrk alignment conventions. - * Add mallinfo, mallopt. Thanks to Raymond Nijssen - (raymond@es.ele.tue.nl) for the suggestion. - * Add `pad' argument to malloc_trim and top_pad mallopt parameter. - * More precautions for cases where other routines call sbrk, - courtesy of Wolfram Gloger (Gloger@lrz.uni-muenchen.de). - * Added macros etc., allowing use in linux libc from - H.J. Lu (hjl@gnu.ai.mit.edu) - * Inverted this history list - - V2.6.1 Sat Dec 2 14:10:57 1995 Doug Lea (dl at gee) - * Re-tuned and fixed to behave more nicely with V2.6.0 changes. - * Removed all preallocation code since under current scheme - the work required to undo bad preallocations exceeds - the work saved in good cases for most test programs. - * No longer use return list or unconsolidated bins since - no scheme using them consistently outperforms those that don't - given above changes. - * Use best fit for very large chunks to prevent some worst-cases. - * Added some support for debugging - - V2.6.0 Sat Nov 4 07:05:23 1995 Doug Lea (dl at gee) - * Removed footers when chunks are in use. Thanks to - Paul Wilson (wilson@cs.texas.edu) for the suggestion. - - V2.5.4 Wed Nov 1 07:54:51 1995 Doug Lea (dl at gee) - * Added malloc_trim, with help from Wolfram Gloger - (wmglo@Dent.MED.Uni-Muenchen.DE). 
- - V2.5.3 Tue Apr 26 10:16:01 1994 Doug Lea (dl at g) - - V2.5.2 Tue Apr 5 16:20:40 1994 Doug Lea (dl at g) - * realloc: try to expand in both directions - * malloc: swap order of clean-bin strategy; - * realloc: only conditionally expand backwards - * Try not to scavenge used bins - * Use bin counts as a guide to preallocation - * Occasionally bin return list chunks in first scan - * Add a few optimizations from colin@nyx10.cs.du.edu - - V2.5.1 Sat Aug 14 15:40:43 1993 Doug Lea (dl at g) - * faster bin computation & slightly different binning - * merged all consolidations to one part of malloc proper - (eliminating old malloc_find_space & malloc_clean_bin) - * Scan 2 returns chunks (not just 1) - * Propagate failure in realloc if malloc returns 0 - * Add stuff to allow compilation on non-ANSI compilers - from kpv@research.att.com - - V2.5 Sat Aug 7 07:41:59 1993 Doug Lea (dl at g.oswego.edu) - * removed potential for odd address access in prev_chunk - * removed dependency on getpagesize.h - * misc cosmetics and a bit more internal documentation - * anticosmetics: mangled names in macros to evade debugger strangeness - * tested on sparc, hp-700, dec-mips, rs6000 - with gcc & native cc (hp, dec only) allowing - Detlefs & Zorn comparison study (in SIGPLAN Notices.) - - Trial version Fri Aug 28 13:14:29 1992 Doug Lea (dl at g.oswego.edu) - * Based loosely on libg++-1.2X malloc. (It retains some of the overall - structure of old version, but most details differ.) - -*/ diff --git a/Src/AmrTask/rts_impls/Utils/dl_malloc.h b/Src/AmrTask/rts_impls/Utils/dl_malloc.h deleted file mode 100644 index 5c047ced436..00000000000 --- a/Src/AmrTask/rts_impls/Utils/dl_malloc.h +++ /dev/null @@ -1,622 +0,0 @@ -/* - Default header file for malloc-2.8.x, written by Doug Lea - and released to the public domain, as explained at - http://creativecommons.org/publicdomain/zero/1.0/ - - This header is for ANSI C/C++ only. You can set any of - the following #defines before including: - - * If USE_DL_PREFIX is defined, it is assumed that malloc.c - was also compiled with this option, so all routines - have names starting with "dl". - - * If HAVE_USR_INCLUDE_MALLOC_H is defined, it is assumed that this - file will be #included AFTER <malloc.h>. This is needed only if - your system defines a struct mallinfo that is incompatible with the - standard one declared here. Otherwise, you can include this file - INSTEAD of your system <malloc.h>. At least on ANSI, all - declarations should be compatible with system versions - - * If MSPACES is defined, declarations for mspace versions are included. -*/ - -#ifndef MALLOC_280_H -#define MALLOC_280_H - -#ifdef __cplusplus -extern "C" { -#endif - -#include <stddef.h> /* for size_t */ - -#ifndef ONLY_MSPACES -#define ONLY_MSPACES 0 /* define to a value */ -#elif ONLY_MSPACES != 0 -#define ONLY_MSPACES 1 -#endif /* ONLY_MSPACES */ -#ifndef NO_MALLINFO -#define NO_MALLINFO 0 -#endif /* NO_MALLINFO */ - -#ifndef MSPACES -#if ONLY_MSPACES -#define MSPACES 1 -#else /* ONLY_MSPACES */ -#define MSPACES 0 -#endif /* ONLY_MSPACES */ -#endif /* MSPACES */ - -// YZ: moved mallinfo before "#if !ONLY_MSPACES" because mspace may use mallinfo too! 
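The configuration block above only declares intent; the matching malloc.c must be compiled with identical settings or the prefixed names and the mallinfo layout will not line up. Below is a minimal, hypothetical sketch of how a client translation unit might configure this header; the flag choices and the grab_and_release() helper are illustrative assumptions, not code taken from AMReX:

/* Hypothetical configuration sketch; compile the matching malloc.c with the same flags. */
#define USE_DL_PREFIX        /* keep the dl-prefixed names; the libc malloc stays visible */
#define MSPACES 1            /* also declare the mspace_* API below */
#include "dl_malloc.h"

void* grab_and_release(void) /* illustrative helper, not part of the header */
{
    void* p = dlmalloc(256); /* dl-prefixed because USE_DL_PREFIX is defined */
    if (p != 0)
        dlfree(p);
    return 0;
}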
-#if !NO_MALLINFO -#ifndef HAVE_USR_INCLUDE_MALLOC_H -#ifndef _MALLOC_H -#ifndef MALLINFO_FIELD_TYPE -#define MALLINFO_FIELD_TYPE size_t -#endif /* MALLINFO_FIELD_TYPE */ -#ifndef STRUCT_MALLINFO_DECLARED -#define STRUCT_MALLINFO_DECLARED 1 - struct mallinfo { - MALLINFO_FIELD_TYPE arena; /* non-mmapped space allocated from system */ - MALLINFO_FIELD_TYPE ordblks; /* number of free chunks */ - MALLINFO_FIELD_TYPE smblks; /* always 0 */ - MALLINFO_FIELD_TYPE hblks; /* always 0 */ - MALLINFO_FIELD_TYPE hblkhd; /* space in mmapped regions */ - MALLINFO_FIELD_TYPE usmblks; /* maximum total allocated space */ - MALLINFO_FIELD_TYPE fsmblks; /* always 0 */ - MALLINFO_FIELD_TYPE uordblks; /* total allocated space */ - MALLINFO_FIELD_TYPE fordblks; /* total free space */ - MALLINFO_FIELD_TYPE keepcost; /* releasable (via malloc_trim) space */ - }; -#endif /* STRUCT_MALLINFO_DECLARED */ -#endif /* _MALLOC_H */ -#endif /* HAVE_USR_INCLUDE_MALLOC_H */ -#endif /* !NO_MALLINFO */ - -#if !ONLY_MSPACES - -#ifndef USE_DL_PREFIX -#define dlcalloc calloc -#define dlfree free -#define dlmalloc malloc -#define dlmemalign memalign -#define dlposix_memalign posix_memalign -#define dlrealloc realloc -#define dlvalloc valloc -#define dlpvalloc pvalloc -#define dlmallinfo mallinfo -#define dlmallopt mallopt -#define dlmalloc_trim malloc_trim -#define dlmalloc_stats malloc_stats -#define dlmalloc_usable_size malloc_usable_size -#define dlmalloc_footprint malloc_footprint -#define dlmalloc_max_footprint malloc_max_footprint -#define dlmalloc_footprint_limit malloc_footprint_limit -#define dlmalloc_set_footprint_limit malloc_set_footprint_limit -#define dlmalloc_inspect_all malloc_inspect_all -#define dlindependent_calloc independent_calloc -#define dlindependent_comalloc independent_comalloc -#define dlbulk_free bulk_free -#endif /* USE_DL_PREFIX */ - -/* - malloc(size_t n) - Returns a pointer to a newly allocated chunk of at least n bytes, or - null if no space is available, in which case errno is set to ENOMEM - on ANSI C systems. - - If n is zero, malloc returns a minimum-sized chunk. (The minimum - size is 16 bytes on most 32bit systems, and 32 bytes on 64bit - systems.) Note that size_t is an unsigned type, so calls with - arguments that would be negative if signed are interpreted as - requests for huge amounts of space, which will often fail. The - maximum supported value of n differs across systems, but is in all - cases less than the maximum representable value of a size_t. -*/ -void* dlmalloc(size_t); - -/* - free(void* p) - Releases the chunk of memory pointed to by p, that had been previously - allocated using malloc or a related routine such as realloc. - It has no effect if p is null. If p was not malloced or already - freed, free(p) will by default cause the current program to abort. -*/ -void dlfree(void*); - -/* - calloc(size_t n_elements, size_t element_size); - Returns a pointer to n_elements * element_size bytes, with all locations - set to zero. -*/ -void* dlcalloc(size_t, size_t); - -/* - realloc(void* p, size_t n) - Returns a pointer to a chunk of size n that contains the same data - as does chunk p up to the minimum of (n, p's size) bytes, or null - if no space is available. - - The returned pointer may or may not be the same as p. The algorithm - prefers extending p in most cases when possible, otherwise it - employs the equivalent of a malloc-copy-free sequence. - - If p is null, realloc is equivalent to malloc. 
- - If space is not available, realloc returns null, errno is set (if on - ANSI) and p is NOT freed. - - if n is for fewer bytes than already held by p, the newly unused - space is lopped off and freed if possible. realloc with a size - argument of zero (re)allocates a minimum-sized chunk. - - The old unix realloc convention of allowing the last-free'd chunk - to be used as an argument to realloc is not supported. -*/ -void* dlrealloc(void*, size_t); - -/* - realloc_in_place(void* p, size_t n) - Resizes the space allocated for p to size n, only if this can be - done without moving p (i.e., only if there is adjacent space - available if n is greater than p's current allocated size, or n is - less than or equal to p's size). This may be used instead of plain - realloc if an alternative allocation strategy is needed upon failure - to expand space; for example, reallocation of a buffer that must be - memory-aligned or cleared. You can use realloc_in_place to trigger - these alternatives only when needed. - - Returns p if successful; otherwise null. -*/ -void* dlrealloc_in_place(void*, size_t); - -/* - memalign(size_t alignment, size_t n); - Returns a pointer to a newly allocated chunk of n bytes, aligned - in accord with the alignment argument. - - The alignment argument should be a power of two. If the argument is - not a power of two, the nearest greater power is used. - 8-byte alignment is guaranteed by normal malloc calls, so don't - bother calling memalign with an argument of 8 or less. - - Overreliance on memalign is a sure way to fragment space. -*/ -void* dlmemalign(size_t, size_t); - -/* - int posix_memalign(void** pp, size_t alignment, size_t n); - Allocates a chunk of n bytes, aligned in accord with the alignment - argument. Differs from memalign only in that it (1) assigns the - allocated memory to *pp rather than returning it, (2) fails and - returns EINVAL if the alignment is not a power of two, (3) fails and - returns ENOMEM if memory cannot be allocated. -*/ -int dlposix_memalign(void**, size_t, size_t); - -/* - valloc(size_t n); - Equivalent to memalign(pagesize, n), where pagesize is the page - size of the system. If the pagesize is unknown, 4096 is used. -*/ -void* dlvalloc(size_t); - -/* - mallopt(int parameter_number, int parameter_value) - Sets tunable parameters. The format is to provide a - (parameter-number, parameter-value) pair. mallopt then sets the - corresponding parameter to the argument value if it can (i.e., so - long as the value is meaningful), and returns 1 if successful else - 0. SVID/XPG/ANSI defines four standard param numbers for mallopt, - normally defined in malloc.h. None of these are used in this malloc, - so setting them has no effect. But this malloc also supports other - options in mallopt: - - Symbol param # default allowed param values - M_TRIM_THRESHOLD -1 2*1024*1024 any (-1U disables trimming) - M_GRANULARITY -2 page size any power of 2 >= page size - M_MMAP_THRESHOLD -3 256*1024 any (or 0 if no MMAP support) -*/ -int dlmallopt(int, int); - -#define M_TRIM_THRESHOLD (-1) -#define M_GRANULARITY (-2) -#define M_MMAP_THRESHOLD (-3) - - -/* - malloc_footprint(); - Returns the number of bytes obtained from the system. The total - number of bytes allocated by malloc, realloc etc., is less than this - value. Unlike mallinfo, this function returns only a precomputed - result, so can be called frequently to monitor memory consumption. - Even if locks are otherwise defined, this function does not use them, - so results might not be up to date. 
-*/ -size_t dlmalloc_footprint(void); - -/* - malloc_max_footprint(); - Returns the maximum number of bytes obtained from the system. This - value will be greater than current footprint if deallocated space - has been reclaimed by the system. The peak number of bytes allocated - by malloc, realloc etc., is less than this value. Unlike mallinfo, - this function returns only a precomputed result, so can be called - frequently to monitor memory consumption. Even if locks are - otherwise defined, this function does not use them, so results might - not be up to date. -*/ -size_t dlmalloc_max_footprint(void); - -/* - malloc_footprint_limit(); - Returns the number of bytes that the heap is allowed to obtain from - the system, returning the last value returned by - malloc_set_footprint_limit, or the maximum size_t value if - never set. The returned value reflects a permission. There is no - guarantee that this number of bytes can actually be obtained from - the system. -*/ -size_t dlmalloc_footprint_limit(void); - -/* - malloc_set_footprint_limit(); - Sets the maximum number of bytes to obtain from the system, causing - failure returns from malloc and related functions upon attempts to - exceed this value. The argument value may be subject to page - rounding to an enforceable limit; this actual value is returned. - Using an argument of the maximum possible size_t effectively - disables checks. If the argument is less than or equal to the - current malloc_footprint, then all future allocations that require - additional system memory will fail. However, invocation cannot - retroactively deallocate existing used memory. -*/ -size_t dlmalloc_set_footprint_limit(size_t bytes); - -/* - malloc_inspect_all(void(*handler)(void *start, - void *end, - size_t used_bytes, - void* callback_arg), - void* arg); - Traverses the heap and calls the given handler for each managed - region, skipping all bytes that are (or may be) used for bookkeeping - purposes. Traversal does not include chunks that have been - directly memory mapped. Each reported region begins at the start - address, and continues up to but not including the end address. The - first used_bytes of the region contain allocated data. If - used_bytes is zero, the region is unallocated. The handler is - invoked with the given callback argument. If locks are defined, they - are held during the entire traversal. It is a bad idea to invoke - other malloc functions from within the handler. - - For example, to count the number of in-use chunks with size greater - than 1000, you could write: - static int count = 0; - void count_chunks(void* start, void* end, size_t used, void* arg) { - if (used >= 1000) ++count; - } - then: - malloc_inspect_all(count_chunks, NULL); - - malloc_inspect_all is compiled only if MALLOC_INSPECT_ALL is defined. -*/ -void dlmalloc_inspect_all(void(*handler)(void*, void *, size_t, void*), - void* arg); - -#if !NO_MALLINFO -/* - mallinfo() - Returns (by copy) a struct containing various summary statistics: - - arena: current total non-mmapped bytes allocated from system - ordblks: the number of free chunks - smblks: always zero. - hblks: current number of mmapped regions - hblkhd: total bytes held in mmapped regions - usmblks: the maximum total allocated space. This will be greater - than current total if trimming has occurred. 
- fsmblks: always zero - uordblks: current total allocated space (normal or mmapped) - fordblks: total free space - keepcost: the maximum number of bytes that could ideally be released - back to system via malloc_trim. ("ideally" means that - it ignores page restrictions etc.) - - Because these fields are ints, but internal bookkeeping may - be kept as longs, the reported values may wrap around zero and - thus be inaccurate. -*/ - -struct mallinfo dlmallinfo(void); -#endif /* NO_MALLINFO */ - -/* - independent_calloc(size_t n_elements, size_t element_size, void* chunks[]); - - independent_calloc is similar to calloc, but instead of returning a - single cleared space, it returns an array of pointers to n_elements - independent elements that can hold contents of size elem_size, each - of which starts out cleared, and can be independently freed, - realloc'ed etc. The elements are guaranteed to be adjacently - allocated (this is not guaranteed to occur with multiple callocs or - mallocs), which may also improve cache locality in some - applications. - - The "chunks" argument is optional (i.e., may be null, which is - probably the most typical usage). If it is null, the returned array - is itself dynamically allocated and should also be freed when it is - no longer needed. Otherwise, the chunks array must be of at least - n_elements in length. It is filled in with the pointers to the - chunks. - - In either case, independent_calloc returns this pointer array, or - null if the allocation failed. If n_elements is zero and "chunks" - is null, it returns a chunk representing an array with zero elements - (which should be freed if not wanted). - - Each element must be freed when it is no longer needed. This can be - done all at once using bulk_free. - - independent_calloc simplifies and speeds up implementations of many - kinds of pools. It may also be useful when constructing large data - structures that initially have a fixed number of fixed-sized nodes, - but the number is not known at compile time, and some of the nodes - may later need to be freed. For example: - - struct Node { int item; struct Node* next; }; - - struct Node* build_list() { - struct Node** pool; - int n = read_number_of_nodes_needed(); - if (n <= 0) return 0; - pool = (struct Node**)(independent_calloc(n, sizeof(struct Node), 0)); - if (pool == 0) die(); - // organize into a linked list... - struct Node* first = pool[0]; - for (int i = 0; i < n-1; ++i) - pool[i]->next = pool[i+1]; - free(pool); // Can now free the array (or not, if it is needed later) - return first; - } -*/ -void** dlindependent_calloc(size_t, size_t, void**); - -/* - independent_comalloc(size_t n_elements, size_t sizes[], void* chunks[]); - - independent_comalloc allocates, all at once, a set of n_elements - chunks with sizes indicated in the "sizes" array. It returns - an array of pointers to these elements, each of which can be - independently freed, realloc'ed etc. The elements are guaranteed to - be adjacently allocated (this is not guaranteed to occur with - multiple callocs or mallocs), which may also improve cache locality - in some applications. - - The "chunks" argument is optional (i.e., may be null). If it is null - the returned array is itself dynamically allocated and should also - be freed when it is no longer needed. Otherwise, the chunks array - must be of at least n_elements in length. It is filled in with the - pointers to the chunks. - - In either case, independent_comalloc returns this pointer array, or - null if the allocation failed. 
If n_elements is zero and chunks is - null, it returns a chunk representing an array with zero elements - (which should be freed if not wanted). - - Each element must be freed when it is no longer needed. This can be - done all at once using bulk_free. - - independent_comalloc differs from independent_calloc in that each - element may have a different size, and also that it does not - automatically clear elements. - - independent_comalloc can be used to speed up allocation in cases - where several structs or objects must always be allocated at the - same time. For example: - - struct Head { ... }; - struct Foot { ... }; - - void send_message(char* msg) { - int msglen = strlen(msg); - size_t sizes[3] = { sizeof(struct Head), msglen, sizeof(struct Foot) }; - void* chunks[3]; - if (independent_comalloc(3, sizes, chunks) == 0) - die(); - struct Head* head = (struct Head*)(chunks[0]); - char* body = (char*)(chunks[1]); - struct Foot* foot = (struct Foot*)(chunks[2]); - // ... - } - - In general though, independent_comalloc is worth using only for - larger values of n_elements. For small values, you probably won't - detect enough difference from series of malloc calls to bother. - - Overuse of independent_comalloc can increase overall memory usage, - since it cannot reuse existing noncontiguous small chunks that - might be available for some of the elements. -*/ -void** dlindependent_comalloc(size_t, size_t*, void**); - -/* - bulk_free(void* array[], size_t n_elements) - Frees and clears (sets to null) each non-null pointer in the given - array. This is likely to be faster than freeing them one-by-one. - If footers are used, pointers that have been allocated in different - mspaces are not freed or cleared, and the count of all such pointers - is returned. For large arrays of pointers with poor locality, it - may be worthwhile to sort this array before calling bulk_free. -*/ -size_t dlbulk_free(void**, size_t n_elements); - -/* - pvalloc(size_t n); - Equivalent to valloc(minimum-page-that-holds(n)), that is, - round up n to nearest pagesize. - */ -void* dlpvalloc(size_t); - -/* - malloc_trim(size_t pad); - - If possible, gives memory back to the system (via negative arguments - to sbrk) if there is unused memory at the `high' end of the malloc - pool or in unused MMAP segments. You can call this after freeing - large blocks of memory to potentially reduce the system-level memory - requirements of a program. However, it cannot guarantee to reduce - memory. Under some allocation patterns, some large free blocks of - memory will be locked between two used chunks, so they cannot be - given back to the system. - - The `pad' argument to malloc_trim represents the amount of free - trailing space to leave untrimmed. If this argument is zero, only - the minimum amount of memory to maintain internal data structures - will be left. Non-zero arguments can be supplied to maintain enough - trailing space to service future expected allocations without having - to re-obtain memory from the system. - - Malloc_trim returns 1 if it actually released any memory, else 0. -*/ -int dlmalloc_trim(size_t); - -/* - malloc_stats(); - Prints on stderr the amount of space obtained from the system (both - via sbrk and mmap), the maximum amount (which may be more than - current if malloc_trim and/or munmap got called), and the current - number of bytes allocated via malloc (or realloc, etc) but not yet - freed. Note that this is the number of bytes allocated, not the - number requested. 
It will be larger than the number requested - because of alignment and bookkeeping overhead. Because it includes - alignment wastage as being in use, this figure may be greater than - zero even when no user-level chunks are allocated. - - The reported current and maximum system memory can be inaccurate if - a program makes other calls to system memory allocation functions - (normally sbrk) outside of malloc. - - malloc_stats prints only the most commonly interesting statistics. - More information can be obtained by calling mallinfo. - - malloc_stats is not compiled if NO_MALLOC_STATS is defined. -*/ -void dlmalloc_stats(void); - -#endif /* !ONLY_MSPACES */ - -/* - malloc_usable_size(void* p); - - Returns the number of bytes you can actually use in - an allocated chunk, which may be more than you requested (although - often not) due to alignment and minimum size constraints. - You can use this many bytes without worrying about - overwriting other allocated objects. This is not a particularly great - programming practice. malloc_usable_size can be more useful in - debugging and assertions, for example: - - p = malloc(n); - assert(malloc_usable_size(p) >= 256); -*/ -size_t dlmalloc_usable_size(const void*); - -#if MSPACES - -/* - mspace is an opaque type representing an independent - region of space that supports mspace_malloc, etc. -*/ -typedef void* mspace; - -/* - create_mspace creates and returns a new independent space with the - given initial capacity, or, if 0, the default granularity size. It - returns null if there is no system memory available to create the - space. If argument locked is non-zero, the space uses a separate - lock to control access. The capacity of the space will grow - dynamically as needed to service mspace_malloc requests. You can - control the sizes of incremental increases of this space by - compiling with a different DEFAULT_GRANULARITY or dynamically - setting with mallopt(M_GRANULARITY, value). -*/ -mspace create_mspace(size_t capacity, int locked); - -/* - destroy_mspace destroys the given space, and attempts to return all - of its memory back to the system, returning the total number of - bytes freed. After destruction, the results of access to all memory - used by the space become undefined. -*/ -size_t destroy_mspace(mspace msp); - -/* - create_mspace_with_base uses the memory supplied as the initial base - of a new mspace. Part (less than 128*sizeof(size_t) bytes) of this - space is used for bookkeeping, so the capacity must be at least this - large. (Otherwise 0 is returned.) When this initial space is - exhausted, additional memory will be obtained from the system. - Destroying this space will deallocate all additionally allocated - space (if possible) but not the initial base. -*/ -mspace create_mspace_with_base(void* base, size_t capacity, int locked); -mspace create_device_mspace_with_base(void* base, size_t capacity, int locked); - -/* - mspace_track_large_chunks controls whether requests for large chunks - are allocated in their own untracked mmapped regions, separate from - others in this mspace. By default large chunks are not tracked, - which reduces fragmentation. However, such chunks are not - necessarily released to the system upon destroy_mspace. Enabling - tracking by setting to true may increase fragmentation, but avoids - leakage when relying on destroy_mspace to release all memory - allocated using this space. The function returns the previous - setting. 
-*/ -int mspace_track_large_chunks(mspace msp, int enable); - -#if !NO_MALLINFO -/* - mspace_mallinfo behaves as mallinfo, but reports properties of - the given space. -*/ -struct mallinfo mspace_mallinfo(mspace msp); -#endif /* NO_MALLINFO */ - -/* - An alias for mallopt. -*/ -int mspace_mallopt(int, int); - -/* - The following operate identically to their malloc counterparts - but operate only for the given mspace argument -*/ -void* mspace_malloc(mspace msp, size_t bytes); -void mspace_free(mspace msp, void* mem); -void* mspace_calloc(mspace msp, size_t n_elements, size_t elem_size); -void* mspace_realloc(mspace msp, void* mem, size_t newsize); -void* mspace_realloc_in_place(mspace msp, void* mem, size_t newsize); -void* mspace_memalign(mspace msp, size_t alignment, size_t bytes); -void** mspace_independent_calloc(mspace msp, size_t n_elements, - size_t elem_size, void* chunks[]); -void** mspace_independent_comalloc(mspace msp, size_t n_elements, - size_t sizes[], void* chunks[]); -size_t mspace_bulk_free(mspace msp, void**, size_t n_elements); -size_t mspace_usable_size(const void* mem); -void mspace_malloc_stats(mspace msp); -int mspace_trim(mspace msp, size_t pad); -size_t mspace_footprint(mspace msp); -size_t mspace_max_footprint(mspace msp); -size_t mspace_footprint_limit(mspace msp); -size_t mspace_set_footprint_limit(mspace msp, size_t bytes); -void mspace_inspect_all(mspace msp, - void(*handler)(void *, void *, size_t, void*), - void* arg); -#endif /* MSPACES */ - -#ifdef __cplusplus -}; /* end of extern "C" */ -#endif - -#endif /* MALLOC_280_H */ diff --git a/Src/AmrTask/rts_impls/Utils/sysInfo.C b/Src/AmrTask/rts_impls/Utils/sysInfo.C deleted file mode 100644 index 3f4974f3f5d..00000000000 --- a/Src/AmrTask/rts_impls/Utils/sysInfo.C +++ /dev/null @@ -1,138 +0,0 @@ -//This code was developed in Rambutan to parse machine information - -#include "sysInfo.H" -#include -#include -#include -#include -using namespace std; - - -namespace { - bool read_line_prefix(istream &is, string &prefix) { - int spaces = 0; - - prefix.clear(); - - while(true) { - int c = is.get(); - - if(c == EOF) - return false; - - if(c == '\n') { - prefix.clear(); - spaces = 0; - continue; - } - - if(c == ':') - return true; - - if(c == ' ') - spaces += 1; - else if(c == '\t') - ; - else { - while(spaces > 0) { - prefix.push_back(' '); - spaces -= 1; - } - prefix.push_back((char)c); - } - } - } -} - -NodeHardware query_node_hardware() { - NodeHardware ans; - - struct Entry { - int proc; - int phys; - int core; - int sib_n; - int core_n; - }; - - vector<Entry> procs; - - { // parse /proc/cpuinfo - ifstream f("/proc/cpuinfo", ios::in); - - string pre; - - Entry e; - int n = 5; - - while(read_line_prefix(f, pre)) { - if(pre == "processor") { - assert(n == 5); - f >> e.proc; - } - else if(pre == "physical id") - f >> e.phys; - else if(pre == "siblings") - f >> e.sib_n; - else if(pre == "core id") - f >> e.core; - else if(pre == "cpu cores") - f >> e.core_n; - else - continue; - - n -= 1; - if(n == 0) { - procs.push_back(e); - n = 5; - } - } - } - - // sort procs by "proc id", weird if wasn't already sorted by OS - std::sort(procs.begin(), procs.end(), [](Entry a, Entry b) { return a.proc < b.proc; }); - - // assert OS numbers procs contiguously from zero - bool ok = true; - for(int i=0; i < (int)procs.size(); i++) - ok = ok && procs[i].proc == i; - assert(ok); - - ans.numa_per_node = procs.size() / procs[0].sib_n; - ans.core_per_numa = procs[0].core_n; - ans.thread_per_core = procs[0].sib_n / procs[0].core_n; - - 
if(procs.size() == 1) { - ans.thread_stride = 0; - ans.core_stride = 0; - ans.numa_stride = 0; - } - else { - ans.thread_stride = procs.size(); - for(int i=1; i < (int)procs.size(); i++) { - if(procs[i].core == procs[0].core && procs[i].phys == procs[0].phys) { - ans.thread_stride = i; - break; - } - } - - ans.core_stride = procs.size(); - for(int i=1; i < (int)procs.size(); i++) { - if(procs[i].core != procs[0].core) { - ans.core_stride = i; - break; - } - } - - ans.numa_stride = procs.size(); - for(int i=1; i < (int)procs.size(); i++) { - if(procs[i].phys != procs[0].phys) { - ans.numa_stride = i; - break; - } - } - } - - return ans; -} - diff --git a/Src/AmrTask/rts_impls/Utils/sysInfo.H b/Src/AmrTask/rts_impls/Utils/sysInfo.H deleted file mode 100644 index 19979e7187c..00000000000 --- a/Src/AmrTask/rts_impls/Utils/sysInfo.H +++ /dev/null @@ -1,39 +0,0 @@ -#ifndef NODE_INFO -#define NODE_INFO - -# include -# include -# include -# include -# include - -// Implementation provided machine primitives. - - - struct NodeHardware { - int thread_per_core; - int core_per_numa; - int numa_per_node; - - // cpuid indexing dimension order - int thread_stride; - int core_stride; - int numa_stride; - - int thread_per_numa() const { return thread_per_core*core_per_numa; } - int thread_per_node() const { return thread_per_core*core_per_numa*numa_per_node; } - int core_per_node() const { return core_per_numa*numa_per_node; } - - int numa_of_core(int core) const { return core/core_per_numa; } - int numa_of_thread(int thread) const { return thread/(thread_per_core*core_per_numa); } - - int core_of_thread(int thread) const { return thread/thread_per_core; } - - int cpuid_of(int thread, int core, int numa) const { - return thread*thread_stride + core*core_stride + numa*numa_stride; - } - }; - - - NodeHardware query_node_hardware(); -#endif diff --git a/Src/AmrTask/rts_impls/mpi/Make.package b/Src/AmrTask/rts_impls/mpi/Make.package deleted file mode 100644 index 21973fa39b2..00000000000 --- a/Src/AmrTask/rts_impls/mpi/Make.package +++ /dev/null @@ -1,12 +0,0 @@ -PERILLA_LIB=EXE -COMMON_DIR=$(AMREX_HOME)/Src/AmrTask/rts_impls/runtime_common - -C$(PERILLA_LIB)_sources += PackageQueue.cpp Perilla.cpp PerillaRts.cpp - -C$(PERILLA_LIB)_headers += $(COMMON_DIR)/Barrier.H Config.H $(COMMON_DIR)/LocalConnection.H PackageQueue.H $(COMMON_DIR)/RegionGraph.H $(COMMON_DIR)/RGIter.H $(COMMON_DIR)/RegionQueue.H $(COMMON_DIR)/RemoteConnection.H $(COMMON_DIR)/WorkerThread.H $(COMMON_DIR)/AsyncMultiFabUtil.H PerillaRts.H - -include $(AMREX_HOME)/Src/AmrTask/rts_impls/runtime_common/perilla.mak -VPATH_LOCATIONS += $(AMREX_HOME)/Src/AmrTask/rts_impls/runtime_common -INCLUDE_LOCATIONS += $(AMREX_HOME)/Src/AmrTask/rts_impls/runtime_common -VPATH_LOCATIONS += $(AMREX_HOME)/Src/AmrTask/rts_impls/mpi -INCLUDE_LOCATIONS += $(AMREX_HOME)/Src/AmrTask/rts_impls/mpi diff --git a/Src/AmrTask/rts_impls/mpi/PackageQueue.H b/Src/AmrTask/rts_impls/mpi/PackageQueue.H deleted file mode 100755 index 362f58c5037..00000000000 --- a/Src/AmrTask/rts_impls/mpi/PackageQueue.H +++ /dev/null @@ -1,58 +0,0 @@ -#ifndef P_PACKAGEQUEUE_H -#define P_PACKAGEQUEUE_H - -#include -#include -#include - -class Package -{ -private: - int source, destination; -public: - double *databuf; - pthread_mutex_t packageLock; - volatile int bufSize; - volatile bool completed; //message transfer is done - volatile bool served; //message transfer request has been served but may have not completed - MPI_Request request; //!for MPI - Package(); - ~Package(); - Package(int size); 
- Package(int src, int dest); - Package(int src, int dest, int size); - void setPackageSource(int src); - void setPackageDestination(int dest); - void completeRequest(void); - void completeRequest(bool canAvoidLock); - bool checkRequest(void); - void generatePackage(int size); -}; - -class PackageQueue -{ -private: - Package *buffer[perilla::MSG_QUEUE_DEFAULT_MAXSIZE]; - volatile int n; - volatile int front; - volatile int rear; - volatile int prear; - int max_size; -public: - pthread_mutex_t queueLock; - PackageQueue(); - ~PackageQueue(); - int queueSize(void); - int queueSize(bool canAvoidLock); - void enqueue(Package* package); - void enqueue(Package* package, bool canAvoidLock); - Package* dequeue(void); - Package* dequeue(bool canAvoidLock); - Package* getRear(void); - Package* getRear(bool canAvoidLock); - Package* getFront(void); - Package* getFront(bool canAvoidLock); - void emptyQueue(bool canAvoidLock); -}; -#endif - diff --git a/Src/AmrTask/rts_impls/mpi/PackageQueue.cpp b/Src/AmrTask/rts_impls/mpi/PackageQueue.cpp deleted file mode 100755 index 00fd736b63b..00000000000 --- a/Src/AmrTask/rts_impls/mpi/PackageQueue.cpp +++ /dev/null @@ -1,261 +0,0 @@ -#include -#include -using namespace perilla; -#ifdef PERILLA_DEBUG -#include -extern PerillaMemCheck memcheck; -#endif - -Package::Package() -{ - databuf = 0; - bufSize = 0; - source = 0; - destination = 0; - completed = false; - served = false; - request = MPI_REQUEST_NULL; - packageLock= PTHREAD_MUTEX_INITIALIZER; -#ifdef PERILLA_DEBUG - memcheck.add(memcheck.genKey(this), (void*)this, "Package"); -#endif -} - -Package::~Package() -{ - if(databuf) delete[] databuf; //databuf is allocated with new double[], so free() would be undefined behavior -#ifdef PERILLA_DEBUG - memcheck.remove(memcheck.genKey(this)); -#endif -} - -Package::Package(int size) -{ - databuf = new double[size]; - bufSize = size; - source = 0; - destination = 0; - completed = false; - served = false; - request = MPI_REQUEST_NULL; - packageLock= PTHREAD_MUTEX_INITIALIZER; -#ifdef PERILLA_DEBUG - memcheck.add(memcheck.genKey(this), (void*)this, "Package"); -#endif -} - -Package::Package(int src, int dest) -{ - databuf = 0; //no payload buffer yet; keeps the destructor safe - bufSize = 0; - source = src; - destination = dest; - completed = false; - served = false; - request = MPI_REQUEST_NULL; - packageLock= PTHREAD_MUTEX_INITIALIZER; -#ifdef PERILLA_DEBUG - memcheck.add(memcheck.genKey(this), (void*)this, "Package"); -#endif -} - -Package::Package(int src, int dest, int size) -{ - databuf = new double[size]; - bufSize = size; - source = src; - destination = dest; - completed = false; - served = false; - request = MPI_REQUEST_NULL; - packageLock= PTHREAD_MUTEX_INITIALIZER; -#ifdef PERILLA_DEBUG - memcheck.add(memcheck.genKey(this), (void*)this, "Package"); -#endif -} - -void Package::setPackageSource(int src) -{ - source = src; -} - -void Package::setPackageDestination(int dest) -{ - destination = dest; -} - -void Package::completeRequest(void) -{ - pthread_mutex_lock(&packageLock); - completed = true; - pthread_mutex_unlock(&packageLock); -} - -void Package::completeRequest(bool canAvoidLock) -{ - if(!canAvoidLock)pthread_mutex_lock(&packageLock); - completed = true; - if(!canAvoidLock)pthread_mutex_unlock(&packageLock); -} - -bool Package::checkRequest(void) -{ - return completed; -} - -void Package::generatePackage(int size) -{ - databuf = new double[size]; - bufSize = size; - source = 0; - destination = 0; - completed = false; - served = false; - request = MPI_REQUEST_NULL; - packageLock= PTHREAD_MUTEX_INITIALIZER; -#ifdef PERILLA_DEBUG - memcheck.add(memcheck.genKey(this), (void*)this, "Package"); -#endif -}
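Taken together, Package and PackageQueue implement a fixed-capacity, mutex-protected circular FIFO of message buffers; the canAvoidLock overloads let a caller that already holds queueLock skip the extra lock/unlock round trip. The following minimal usage sketch of this deleted API is hypothetical: the demo() function, the rank numbers, and the 128-double payload are assumptions for illustration, and an MPI build is required because Package embeds an MPI_Request.

// Hypothetical usage sketch of the deleted Package/PackageQueue API.
#include <PackageQueue.H>   // assumed include path into the Perilla sources

void demo()
{
    PackageQueue q;                       // empty queue, capacity perilla::MSG_QUEUE_DEFAULT_MAXSIZE
    Package* p = new Package(0, 1, 128);  // src rank 0, dest rank 1, 128-double payload
    q.enqueue(p);                         // locking variant; safe from any thread
    if (q.queueSize() > 0) {
        Package* out = q.dequeue();       // FIFO: the same package comes back out
        out->completeRequest();           // mark the (pretend) transfer finished under packageLock
        delete out;                       // ~Package releases databuf
    }
}                                         // ~PackageQueue drains anything left over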
- -PackageQueue::PackageQueue() -{ - n = 0; - front = 0; - rear = 0; - prear = -1; - queueLock = PTHREAD_MUTEX_INITIALIZER; -} - -int PackageQueue::queueSize(void) -{ - int size; - pthread_mutex_lock(&queueLock); - size = n; - pthread_mutex_unlock(&queueLock); - return size; -} - -int PackageQueue::queueSize(bool canAvoidLock) -{ - int size; - if(!canAvoidLock)pthread_mutex_lock(&queueLock); - size = n; - if(!canAvoidLock)pthread_mutex_unlock(&queueLock); - return size; -} - -void PackageQueue::enqueue(Package* package) -{ - pthread_mutex_lock(&queueLock); -#ifdef PERILLA_DEBUG - if(n==perilla::MSG_QUEUE_DEFAULT_MAXSIZE){ - printf("Failed to Enqueue: Queue Overflow\n"); - exit(1); - } -#endif - buffer[rear] = package; - prear = rear; - rear = (rear+1)%perilla::MSG_QUEUE_DEFAULT_MAXSIZE; - n++; - pthread_mutex_unlock(&queueLock); -} - -void PackageQueue::enqueue(Package* package, bool canAvoidLock) -{ - if(!canAvoidLock)pthread_mutex_lock(&queueLock); -#ifdef PERILLA_DEBUG - if(n==perilla::MSG_QUEUE_DEFAULT_MAXSIZE){ - printf("Failed to Enqueue: Queue Overflow\n"); - exit(1); - } -#endif - buffer[rear] = package; - prear = rear; - rear = (rear+1)%perilla::MSG_QUEUE_DEFAULT_MAXSIZE; - n++; - if(!canAvoidLock)pthread_mutex_unlock(&queueLock); -} - -Package* PackageQueue::dequeue(void) -{ - Package* package = 0; - pthread_mutex_lock(&queueLock); -#ifdef PERILLA_DEBUG - if(n<=0){ //catch the first underflow, not the second - printf("Failed to Dequeue: Queue Empty\n"); - exit(1); - } -#endif - package = buffer[front]; - front = (front+1)%perilla::MSG_QUEUE_DEFAULT_MAXSIZE; - n--; - pthread_mutex_unlock(&queueLock); - return package; -} - -Package* PackageQueue::dequeue(bool canAvoidLock) -{ - Package* package = 0; - if(!canAvoidLock)pthread_mutex_lock(&queueLock); -#ifdef PERILLA_DEBUG - if(n<=0){ - printf("Failed to Dequeue: Queue Empty\n"); - exit(1); - } -#endif - package = buffer[front]; - front = (front+1)%perilla::MSG_QUEUE_DEFAULT_MAXSIZE; - n--; - if(!canAvoidLock)pthread_mutex_unlock(&queueLock); - return package; -} - -Package* PackageQueue::getRear(void) -{ - Package* package = 0; - pthread_mutex_lock(&queueLock); - if(n) package = buffer[prear]; - pthread_mutex_unlock(&queueLock); - return package; -} - -Package* PackageQueue::getRear(bool canAvoidLock) -{ - Package* package = 0; - if(!canAvoidLock)pthread_mutex_lock(&queueLock); - if(n) package = buffer[prear]; - if(!canAvoidLock)pthread_mutex_unlock(&queueLock); - return package; -} - -Package* PackageQueue::getFront(void) -{ - Package* package = 0; - pthread_mutex_lock(&queueLock); - if(n) package = buffer[front]; - pthread_mutex_unlock(&queueLock); - return package; -} - -Package* PackageQueue::getFront(bool canAvoidLock) -{ - Package* package = 0; - if(!canAvoidLock) pthread_mutex_lock(&queueLock); - if(n) package = buffer[front]; - if(!canAvoidLock) pthread_mutex_unlock(&queueLock); - return package; -} - -void PackageQueue::emptyQueue(bool canAvoidLock){ - if(!canAvoidLock) pthread_mutex_lock(&queueLock); - while(n){ - Package* p = dequeue(true); - delete p; - } - if(!canAvoidLock) pthread_mutex_unlock(&queueLock); -} - -PackageQueue::~PackageQueue() -{ - emptyQueue(true); -} diff --git a/Src/AmrTask/rts_impls/mpi/Perilla.H b/Src/AmrTask/rts_impls/mpi/Perilla.H deleted file mode 100755 index 2bc3301ae9e..00000000000 --- a/Src/AmrTask/rts_impls/mpi/Perilla.H +++ /dev/null @@ -1,92 +0,0 @@ -#ifndef _PERILLA_ -#define _PERILLA_ - -#include -#include -#include -#include -#include - -#include - -//#define USE_PERILLA_PTHREADS - -using namespace std; - -namespace amrex{ - class 
Perilla - { - static int tagGen(int src, int dest, int channelID, int nFabs, int nChannels); - - public: - static int uTags; - static bool genTags; - static int max_step; - - static std::map> pTagCnt; - static std::map>>>> tagMap; - static std::map>>> myTagMap; - static void clearTagMap(); - static void clearMyTagMap(); - static void communicateTags(); - static void registerId(int tid); - static int tid(); - static volatile int numTeamsFinished; - static volatile int updateMetadata_request; - static volatile int updateMetadata_noticed; - static volatile int updateMetadata_done; - static Barrier * globalBarrier; - static void syncProcesses(); - static void multifabBuildFabCon(RegionGraph* graph, const MultiFab& mf, const Periodicity& period); - static void serviceLocalRequests(RegionGraph *graph, int tg); - static void serviceRemoteRequests(RegionGraph *graph, int graphID, int nGraphs); - static void serviceRemoteRequests(RegionGraph *graph); - static void serviceSingleGraphComm(RegionGraph* graph, int tid); - static void serviceMultipleGraphComm(RegionGraph graphArray[], int nGraphs, bool cpyAcross, int tid); - static void serviceMultipleGraphCommDynamic(std::vectorgraphArray, bool cpyAcross, int tid); - static void flattenGraphHierarchy(std::vector >graphArray, std::vector &flattenedGraphArray); - static void serviceMultipleGraphComm(RegionGraph graphArray[], int nGraphs, int tid); - static void fillBoundaryPush(RegionGraph* graph, MultiFab* mf, int f); - static void fillBoundaryPull(RegionGraph* graph, MultiFab* mf, int f, bool singleT); - - static void serviceLocalGridCopyRequests(std::vector graphArray, int g, int tg); - static void serviceRemoteGridCopyRequests(std::vector graphArray, int g, int nGraph, int tg); - static void resetRemoteGridCopyRequests(std::vector graphArray, int g, int nGraph, int tg); - - static void fillBoundaryPush(amrex::RGIter& rgi, amrex::MultiFab& mf); - static void fillBoundaryPull(amrex::RGIter& rgi, amrex::MultiFab& mf, bool singleT); - static void fillBoundaryPush(amrex::RGIter& rgi, RegionGraph *graph, amrex::MultiFab& mf); - static void fillBoundaryPull(amrex::RGIter& rgi, RegionGraph *graph, amrex::MultiFab& mf, bool singleT); - - ///////////////////////////////////////////////////////////////////////////////////////////////////////////////// - - - void multifabExtractCopyAssoc(void* threadInfo); - static void multifabExtractCopyAssoc(RegionGraph* gDst, RegionGraph* gSrc, const MultiFab& dmf, const MultiFab& smf, int nc, int ng, int ngSrc, const Periodicity& period); - static void multifabExtractCopyAssoc(RegionGraph* gDst, RegionGraph* gSrc, const MultiFab& dmf, const MultiFab& smf, const Periodicity& period); - static void multifabCopyPushAsync(RegionGraph* destGraph, RegionGraph* srcGraph, MultiFab* dmf, MultiFab* smf, int f, int dstcomp, int srccomp, int nc, int ng, int ngsrc, bool singleT); - static void multifabCopyPushAsync(RegionGraph* destGraph, RegionGraph* srcGraph, MultiFab* dmf, MultiFab* smf, int f, bool singleT); - - - static void multifabCopyPush(RegionGraph* destGraph, RegionGraph* srcGraph, amrex::MultiFab* dmf, amrex::MultiFab* smf, int f, int dstcomp, int srccomp, int nc, int ng, int ngsrc, bool singleT); - static void multifabCopyPush(RegionGraph* destGraph, RegionGraph* srcGraph, amrex::MultiFab* dmf, amrex::MultiFab* smf, int f, bool singleT); - - static void multifabCopyPull(RegionGraph* destGraph, RegionGraph* srcGraph, MultiFab* dmf, MultiFab* smf, int f, int dstcomp, int srccomp, int nc, int ng, int ngsrc, bool singleT); - 
static void multifabCopyPull(RegionGraph* destGraph, RegionGraph* srcGraph, MultiFab* dmf, MultiFab* smf, int f, bool singleT); - - //static void multifabCopyPull(RegionGraph* destGraph, RegionGraph* srcGraph, MultiFab* dmf, MultiFab* smf, int f, int dstcomp, int srccomp, int nc, int ng, int ngsrc, bool singleT, bool mTeams=true); - - //static void multifabCopyPush(RegionGraph* destGraph, RegionGraph* srcGraph, amrex::MultiFab* dmf, amrex::MultiFab* smf, int f, int dstcomp, int srccomp, int nc, int ng, int ngsrc, bool singleT, bool mTeams=true); - - //static void multifabCopyPush(RegionGraph* destGraph, RegionGraph* srcGraph, amrex::MultiFab* dmf, amrex::MultiFab* smf, int f, bool singleT, bool mTeams=true); - //static void multifabCopyPull(RegionGraph* destGraph, RegionGraph* srcGraph, MultiFab* dmf, MultiFab* smf, int f, bool singleT, bool mTeams=true); - - - static void multifabCopyPush_1Team(RegionGraph* destGraph, RegionGraph* srcGraph, amrex::MultiFab* dmf, amrex::MultiFab* smf, int f, int dstcomp, int srccomp, int nc, int ng, int ngsrc, bool singleT); - //static void fillBoundaryPush_1Team(RegionGraph *graph, amrex::MultiFab& mf, int f, bool mOneThread=false); - - //static void multifabCopyPull_1Team(RegionGraph* destGraph, RegionGraph* srcGraph, amrex::MultiFab* dmf, amrex::MultiFab* smf, int f, int dstcomp, int srccomp, int nc, int ng, int ngsrc, bool singleT); - static void fillBoundaryPull_1Team(RegionGraph *graph, amrex::MultiFab& mf, int f); - }; // class Perilla -} -#endif diff --git a/Src/AmrTask/rts_impls/mpi/Perilla.cpp b/Src/AmrTask/rts_impls/mpi/Perilla.cpp deleted file mode 100755 index 8a9fb76038d..00000000000 --- a/Src/AmrTask/rts_impls/mpi/Perilla.cpp +++ /dev/null @@ -1,976 +0,0 @@ -#include -#include -#include -#include -#include -#include -#include -#include -#include -#include -#include -#include -#include -using namespace std; -using namespace amrex; -using namespace perilla; - -#ifdef PERILLA_DEBUG -#include -#include - -const double kMicro = 1.0e-6; -double getTime() -{ - struct timeval TV; - const int RC = gettimeofday(&TV, NULL); - if(RC == -1) - { - printf("ERROR: Bad call to gettimeofday\n"); - return(-1); - } - return( ((double)TV.tv_sec) + kMicro * ((double)TV.tv_usec) ); -} - -double isendDelay=0.0; -double irecvDelay=0.0; -double isendTestDelay=0.0; -double irecvTestDelay=0.0; -double localScheDelay=0.0; -#endif - -void Perilla::syncProcesses(){ - MPI_Barrier(MPI_COMM_WORLD); -} - -void Perilla::serviceLocalRequests(RegionGraph* rg, int tg) -{ - int numfabs = rg->lMap.size(); - for(int f=0; flMap[f]->l_con.nscpy; i++) - if(rg->lMap[f]->l_con.scpy[i].pQueue.queueSize(true)>0){ - anyReq=true; - break; - } - if(anyReq){ - pthread_mutex_lock(&(rg->lMap[f]->l_con.sLock)); - for(int i=0; ilMap[f]->l_con.nscpy; i++){ - if(rg->lMap[f]->l_con.scpy[i].pQueue.queueSize(true)>0) - { - Package *sPackage = rg->lMap[f]->l_con.scpy[i].pQueue.dequeue(true); - pthread_mutex_lock(&(rg->lMap[rg->lMap[f]->l_con.scpy[i].nd]->l_con.dLock)); - int dPartner = rg->lMap[f]->l_con.scpy[i].dPartner; - Package *dPackage = rg->lMap[rg->lMap[f]->l_con.scpy[i].nd]->l_con.dcpy[dPartner].recycleQueue.dequeue(true); - std::memcpy(dPackage->databuf, sPackage->databuf, dPackage->bufSize * sizeof(double)); - rg->lMap[rg->lMap[f]->l_con.scpy[i].nd]->l_con.dcpy[dPartner].pQueue.enqueue(dPackage,true); - if(rg->lMap[rg->lMap[f]->l_con.scpy[i].nd]->l_con.dcpy[dPartner].pQueue.queueSize(true)==1) - rg->lMap[rg->lMap[f]->l_con.scpy[i].nd]->l_con.firingRuleCnt++; - 
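-                            // The firing-rule counter is the dependency count that releases a
-                            // region's task: it is bumped only when a destination queue goes from
-                            // empty to non-empty (queueSize(true)==1 right after the enqueue), so
-                            // a dependency is counted when data first becomes available, not once
-                            // per queued package.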
pthread_mutex_unlock(&(rg->lMap[rg->lMap[f]->l_con.scpy[i].nd]->l_con.dLock)); - rg->lMap[f]->l_con.scpy[i].recycleQueue.enqueue(sPackage,true); - } - } - pthread_mutex_unlock(&(rg->lMap[f]->l_con.sLock)); - }//if there is any local send request - }// if my region - }// for(frMap.size(); - int tg = WorkerThread::perilla_wid(); - - // !we first pre-post receive - for(int f=0; flMap[f]->r_con.nrcv; i++) - { - if(rg->rMap[f]->r_con.rcv[i].pQueue.queueSize(true) == 0) //!no message has been received or all received messages have been claimed - nextrReq = true; - else - { - //we buffer at most 2 packages per send task - recv task pair, but 1 must be completed before we buffer the next to allow for tag reuse - Package *rearPackage = rg->rMap[f]->r_con.rcv[i].pQueue.getRear(true); - if(rearPackage) - if(rearPackage->completed && rg->rMap[f]->r_con.rcv[i].pQueue.queueSize(true) == 1) //!latest receive request has been completed - nextrReq = true; - else //!expected message is still on the way - nextrReq = false; - } - if(nextrReq) //!take a message from recycle pool and post a receive - { - pthread_mutex_lock(&(rg->rMap[f]->r_con.rcvLock)); - pthread_mutex_lock(&(rg->lMap[f]->r_con.rcvLock)); - int ns = rg->rMap[f]->r_con.rcv[i].ns; - int nd = rg->rMap[f]->r_con.rcv[i].nd; - int lnd = rg->rMap[f]->r_con.rcv[i].lnd; - int r_grids = rg->rMap[f]->r_con.rcv[i].r_grids; - //!create a package to keep track of receive requests - Package *rMetaPackage = rg->rMap[f]->r_con.rcv[i].recycleQueue.dequeue(true); - //!extract a package from the recycle pool at the destination NUMA node to buffer incoming data - Package *rPackage = rg->lMap[f]->r_con.rcv[i].recycleQueue.dequeue(true); - int tag = tagMap[rg->rMap[f]->r_con.rcv[i].pr][graphID][nd][ns][rg->rMap[f]->r_con.rcv[i].sz]; - - rMetaPackage->request = MPI_REQUEST_NULL; - rg->lMap[f]->r_con.rcv[i].pQueue.enqueue(rPackage,true); //!this is not done yet - rg->rMap[f]->r_con.rcv[i].pQueue.enqueue(rMetaPackage,true); //!this is not done yet - rMetaPackage->request = ParallelDescriptor::Arecv(rPackage->databuf, - rg->rMap[f]->r_con.rcv[i].sz, - rg->rMap[f]->r_con.rcv[i].pr, tag).req(); // tag == SeqNum in c++ ver - pthread_mutex_unlock(&(rg->lMap[f]->r_con.rcvLock)); - pthread_mutex_unlock(&(rg->rMap[f]->r_con.rcvLock)); - } - }//for num messages in each Fab - }// for(fsMap[f]->r_con.nsnd; i++) - { - if(rg->sMap[f]->r_con.snd[i].pQueue.queueSize(true) == 0) //then !no message has been issued or all send requests have been fulfilled - nextsReq = false; - else - nextsReq = true; - - if(nextsReq) - { - Package *sMetaPackage = rg->sMap[f]->r_con.snd[i].pQueue.getFront(true); - if(!sMetaPackage->served) - { - Package *sPackage = rg->lMap[f]->r_con.snd[i].pQueue.getFront(true); - sMetaPackage->completed = false; - sMetaPackage->served = true; - sMetaPackage->request = MPI_REQUEST_NULL; - int ns = rg->sMap[f]->r_con.snd[i].ns; - int nd = rg->sMap[f]->r_con.snd[i].nd; - int r_gid = rg->sMap[f]->r_con.snd[i].r_gid; - int r_grids = rg->sMap[f]->r_con.snd[i].r_grids; - int tag = Perilla::myTagMap[r_gid][nd][ns][rg->sMap[f]->r_con.snd[i].sz]; - sMetaPackage->request = ParallelDescriptor::Asend(sPackage->databuf, - rg->sMap[f]->r_con.snd[i].sz, - rg->sMap[f]->r_con.snd[i].pr, tag).req(); - } - } - } // for(irMap[f]->r_con.nrcv; i++) - { - if(rg->rMap[f]->r_con.rcv[i].pQueue.queueSize(true) > 0) //by our policy, we can assume that all messages before rear have completed - { - //we dont need to lock the queue, because other consumers just take front messages. 
A circular buffer guarantees that the rear of the queue can be safely accessed when other queue data is modified - Package *rearPackage = rg->rMap[f]->r_con.rcv[i].pQueue.getRear(true); - if(rearPackage) - if(!(rearPackage->completed)) - { - bool flag = false; - int ret_flag; - MPI_Status status; - ParallelDescriptor::Test(rearPackage->request, ret_flag, status); - flag = (ret_flag == 0) ? false : true; - if(flag) - { - pthread_mutex_lock(&(rg->lMap[f]->r_con.rcvLock)); - rearPackage->completeRequest(true); - rg->lMap[f]->r_con.rcv[i].pQueue.getRear()->completeRequest(true); - if(rg->rMap[f]->r_con.rcv[i].pQueue.queueSize(true) == 1) - rg->lMap[f]->r_con.firingRuleCnt++; - pthread_mutex_unlock(&(rg->lMap[f]->r_con.rcvLock)); - } - } - } // if(queueSize > 0) - } // for(ilMap[f]->r_con.nsnd; i++) - { - if(rg->sMap[f]->r_con.snd[i].pQueue.queueSize(true) > 0) - { - Package *frontPackage = rg->sMap[f]->r_con.snd[i].pQueue.getFront(true); - if(frontPackage->served && !frontPackage->completed) //!latest receive request has NOT been completed - { - bool flag = false; - int ret_flag; - MPI_Status status; - ParallelDescriptor::Test(frontPackage->request, ret_flag, status); - flag = (ret_flag == 0) ? false : true; - if(flag) - { - pthread_mutex_lock(&(rg->sMap[f]->r_con.sndLock)); - frontPackage = rg->sMap[f]->r_con.snd[i].pQueue.dequeue(true); - frontPackage->completed = false; - frontPackage->served = false; - frontPackage->request = MPI_REQUEST_NULL; - rg->sMap[f]->r_con.snd[i].recycleQueue.enqueue(frontPackage,true); - pthread_mutex_unlock(&(rg->sMap[f]->r_con.sndLock)); - pthread_mutex_lock(&(rg->lMap[f]->r_con.sndLock)); - frontPackage = rg->lMap[f]->r_con.snd[i].pQueue.dequeue(true); - frontPackage->completed = false; - frontPackage->served = false; - frontPackage->request = MPI_REQUEST_NULL; - rg->lMap[f]->r_con.snd[i].recycleQueue.enqueue(frontPackage,true); - pthread_mutex_unlock(&(rg->lMap[f]->r_con.sndLock)); - } - } - } // if(queueSize > 0) - } // for(i graphArray, bool cpyAcross, int tid) -{ - int tg = WorkerThread::perilla_wid(); - int np = ParallelDescriptor::NProcs(); - int nGraphs = graphArray.size(); - - for(int g=0; g 1) - { - if(tg==0) - { - serviceRemoteRequests(graphArray[g],g,nGraphs); - if(cpyAcross) - serviceRemoteGridCopyRequests(graphArray,g,nGraphs,tg); - } - } - } -}//serviceMultipleGraphCommDynamic - -void Perilla::multifabCopyPull(RegionGraph* destGraph, RegionGraph* srcGraph, MultiFab* mfDst, MultiFab* mfSrc, int f, int dstcomp, int srccomp, int nc, int ng, int ngsrc, bool singleT) -{ - int myProc = ParallelDescriptor::MyProc(); - - int ntid = WorkerThread::perilla_wtid(); - int tg = WorkerThread::perilla_wid(); - if(nc<1) cout <<"MULTIFAB_COPY_C: nc must be >= 1"<< endl; - if(mfDst->nComp() < (dstcomp-1)) cout <<"MULTIFAB_COPY_C: nc too large for dst multifab"<< endl; - - if(true)//if(!(*mfDst == *mfSrc)) - { - if(ng > mfDst->nGrow()) cout <<"MULTIFAB_COPY_C: ng > 0 not supported in parallel copy"<< endl; - FabCopyAssoc* cpDst = destGraph->task[f]->cpAsc_dstHead; - while(cpDst != 0) - { - if(cpDst->graphPartner == srcGraph) - break; - cpDst = cpDst->next; - } - if(cpDst == 0) cout <<"Metadata for across grid copy not found"<< endl; - if(singleT) - { - pthread_mutex_lock(&(cpDst->l_con.dLock)); - for(int i=0; il_con.ndcpy; i++) - { - Package* rcvPackage = cpDst->l_con.dcpy[i].pQueue.getFront(true); // corrected from recycleQ to pQ - mfDst->m_fabs_v[f]->copyFromMem(cpDst->l_con.dcpy[i].dbx,dstcomp,nc,rcvPackage->databuf); - } - for(int i=0; il_con.ndcpy; i++) - 
cpDst->l_con.dcpy[i].recycleQueue.enqueue(cpDst->l_con.dcpy[i].pQueue.dequeue()); // corrected from pQ to recycleQ and from recycleQ to pQ - cpDst->l_con.firingRuleCnt = cpDst->l_con.firingRuleCnt - cpDst->l_con.ndcpy; - pthread_mutex_unlock(&(cpDst->l_con.dLock)); - } - else - { - if(ntid==0){ - pthread_mutex_lock(&(cpDst->l_con.dLock)); - for(int i=0; il_con.ndcpy; i++) - { - Package* rcvPackage = cpDst->l_con.dcpy[i].pQueue.getFront(true); // corrected from recycleQ to pQ - mfDst->m_fabs_v[f]->copyFromMem(cpDst->l_con.dcpy[i].dbx,dstcomp,nc,rcvPackage->databuf); - } - for(int i=0; il_con.ndcpy; i++) - cpDst->l_con.dcpy[i].recycleQueue.enqueue(cpDst->l_con.dcpy[i].pQueue.dequeue()); // corrected from pQ to recycleQ and from recycleQ to pQ - cpDst->l_con.firingRuleCnt = cpDst->l_con.firingRuleCnt - cpDst->l_con.ndcpy; - pthread_mutex_unlock(&(cpDst->l_con.dLock)); - } - } - - int np = ParallelDescriptor::NProcs(); - if(np == 1) - return; - - if(singleT) - { - pthread_mutex_lock(&(cpDst->r_con.rcvLock)); - for(int i=0; ir_con.nrcv; i++) - { - ///* - Package* rcvPackage = cpDst->r_con.rcv[i].pQueue.dequeue(true); // corrected from recycleQ to pQ - mfDst->m_fabs_v[f]->copyFromMem(cpDst->r_con.rcv[i].dbx,dstcomp,nc,rcvPackage->databuf); - rcvPackage->completed = false; - rcvPackage->served = false; - rcvPackage->request = MPI_REQUEST_NULL; - cpDst->r_con.rcv[i].recycleQueue.enqueue(rcvPackage, true); // corrected from pQ to recycleQ - } - cpDst->r_con.firingRuleCnt = cpDst->r_con.firingRuleCnt - cpDst->r_con.nrcv; - - cpDst->r_con.remotePullDone = true; - ///* - for(int i=0; ir_con.nrcv; i++) - if(cpDst->r_con.rcv[i].pQueue.queueSize(true) >= 1) - if(cpDst->r_con.rcv[i].pQueue.getFront(true)->checkRequest()) - cpDst->r_con.firingRuleCnt++; - //*/ - pthread_mutex_unlock(&(cpDst->r_con.rcvLock)); - } - else - { - if(ntid==0) - { - pthread_mutex_lock(&(cpDst->r_con.rcvLock)); - for(int i=0; ir_con.nrcv; i++) - { - Package* rcvPackage = cpDst->r_con.rcv[i].pQueue.dequeue(true); // corrected from recycleQ to pQ - mfDst->m_fabs_v[f]->copyFromMem(cpDst->r_con.rcv[i].dbx,dstcomp,nc,rcvPackage->databuf); - rcvPackage->completed = false; - rcvPackage->served = false; - rcvPackage->request = MPI_REQUEST_NULL; - cpDst->r_con.rcv[i].recycleQueue.enqueue(rcvPackage, true); // corrected from pQ to recycleQ - } - cpDst->r_con.firingRuleCnt = cpDst->r_con.firingRuleCnt - cpDst->r_con.nrcv; - - cpDst->r_con.remotePullDone = true; - for(int i=0; ir_con.nrcv; i++) - if(cpDst->r_con.rcv[i].pQueue.queueSize() >= 1) - if(cpDst->r_con.rcv[i].pQueue.getFront()->checkRequest()) - cpDst->r_con.firingRuleCnt++; - pthread_mutex_unlock(&(cpDst->r_con.rcvLock)); - } - } - } // if(!(*mfDst == *mfSrc)) -} // multifabCopyPull - - -void Perilla::fillBoundaryPull(RegionGraph* graph, MultiFab* mf, int f, bool singleT) -{ - - int nComp = mf->nComp(); - int tg= WorkerThread::perilla_wid(); - int ntid = WorkerThread::perilla_wtid(); - - if(ntid==0) - pthread_mutex_lock(&(graph->lMap[f]->l_con.dLock)); - if(!singleT) - graph->worker[tg]->barr->sync(perilla::NUM_THREADS_PER_TEAM-1); // Barrier to synchronize team threads - - for(int i=0; ilMap[f]->l_con.ndcpy; i++) - if( (i%(perilla::NUM_THREADS_PER_TEAM-1)) == ntid) - { - Package *dPackage = graph->lMap[f]->l_con.dcpy[i].pQueue.getFront(true); - mf->m_fabs_v[f]->copyFromMem(graph->lMap[f]->l_con.dcpy[i].dbx,0,nComp,dPackage->databuf); - } - - if(!singleT) - graph->worker[tg]->barr->sync(perilla::NUM_THREADS_PER_TEAM-1); // Barrier to synchronize team threads - if(ntid==0) - { - 
for(int i=0; ilMap[f]->l_con.ndcpy; i++) - graph->lMap[f]->l_con.dcpy[i].recycleQueue.enqueue( graph->lMap[f]->l_con.dcpy[i].pQueue.dequeue(true),true ); - - graph->lMap[f]->l_con.firingRuleCnt = graph->lMap[f]->l_con.firingRuleCnt - graph->lMap[f]->l_con.ndcpy; - - graph->lMap[f]->l_con.scpyCnt = 0; - for(int i=0; ilMap[f]->l_con.ndcpy; i++) - if(graph->lMap[f]->l_con.dcpy[i].pQueue.queueSize(true) >= 1) - graph->lMap[f]->l_con.firingRuleCnt++; - pthread_mutex_unlock(&(graph->lMap[f]->l_con.dLock)); - } - if(!singleT) - graph->worker[tg]->barr->sync(perilla::NUM_THREADS_PER_TEAM-1); // Barrier to synchronize team threads - - int np = ParallelDescriptor::NProcs(); - if (np==1) return; - - if(ntid==0) - { - pthread_mutex_lock(&(graph->rMap[f]->r_con.rcvLock)); - pthread_mutex_lock(&(graph->lMap[f]->r_con.rcvLock)); - } - if(!singleT) - graph->worker[tg]->barr->sync(perilla::NUM_THREADS_PER_TEAM-1); // Barrier to synchronize team threads - - for(int i=0; ilMap[f]->r_con.nrcv; i++) - if( (i%(perilla::NUM_THREADS_PER_TEAM-1)) == ntid) - { - Package *rcvMetaPackage = graph->rMap[f]->r_con.rcv[i].pQueue.dequeue(true); - rcvMetaPackage->completed = false; - rcvMetaPackage->served = false; - rcvMetaPackage->request = 0; - graph->rMap[f]->r_con.rcv[i].recycleQueue.enqueue(rcvMetaPackage,true); - Package *rcvPackage = graph->lMap[f]->r_con.rcv[i].pQueue.dequeue(true); - mf->m_fabs_v[f]->copyFromMem(graph->lMap[f]->r_con.rcv[i].dbx,0,nComp,rcvPackage->databuf); - rcvPackage->completed = false; - graph->lMap[f]->r_con.rcv[i].recycleQueue.enqueue(rcvPackage,true); - } - if(!singleT) - graph->worker[tg]->barr->sync(perilla::NUM_THREADS_PER_TEAM-1); // Barrier to synchronize team threads - if(ntid==0) - { - graph->lMap[f]->r_con.firingRuleCnt = graph->lMap[f]->r_con.firingRuleCnt - graph->lMap[f]->r_con.nrcv; - for(int i=0; ilMap[f]->r_con.nrcv; i++) - if(graph->lMap[f]->r_con.rcv[i].pQueue.queueSize(true) >= 1) - if(graph->lMap[f]->r_con.rcv[i].pQueue.getFront(true)->checkRequest()) - graph->lMap[f]->r_con.firingRuleCnt++; - pthread_mutex_unlock(&(graph->lMap[f]->r_con.rcvLock)); - pthread_mutex_unlock(&(graph->rMap[f]->r_con.rcvLock)); - } - -} // fillBoundaryPull - - - -void Perilla::fillBoundaryPull_1Team(RegionGraph* graph, amrex::MultiFab& mf, int f) -{ - exit(0); -} // fillBoundaryPull - - -void Perilla::multifabCopyPushAsync(RegionGraph* destGraph, RegionGraph* srcGraph, MultiFab* mfDst, MultiFab* mfSrc, int f, int dstcomp, int srccomp, int nc, int ng, int ngsrc, bool singleT) -{ - int ntid = WorkerThread::perilla_wtid(); - int tg = WorkerThread::perilla_wid(); - int myProc = ParallelDescriptor::MyProc(); - // MultiFab* mfDst = destGraph->assocMF; - // MultiFab* mfSrc = srcGraph->assocMF; - if(nc<1) cout <<"MULTIFAB_COPY_C: nc must be >= 1"<< endl; - if(mfDst->nComp() < (dstcomp-1)) cout <<"MULTIFAB_COPY_C: nc too large for dst multifab"<< endl; - if(mfSrc->nComp() < (srccomp-1)) cout <<"MULTIFAB_COPY_C: nc too large for src multifab"<< endl; - - if(true)//if(!(*mfDst == *mfSrc)) - { - if(ng > mfDst->nGrow()) cout <<"MULTIFAB_COPY_C: ng > 0 not supported in parallel copy"<< endl; - if(ngsrc > mfSrc->nGrow()) cout <<"MULTIFAB_COPY_C: ngsrc > msrc%ng"<< endl; - FabCopyAssoc* cpSrc = srcGraph->task[f]->cpAsc_srcHead; - - while(cpSrc != 0) - { - if(cpSrc->graphPartner == destGraph) - break; - cpSrc = cpSrc->next; - } - if(cpSrc == 0) cout <<"Metadata for across grid copy not found"<< endl; - - if(singleT) - { - pthread_mutex_lock(&(cpSrc->l_con.sLock)); - for(int i=0; il_con.nscpy; i++) - { - 
Package* sndPackage = cpSrc->l_con.scpy[i].recycleQueue.getFront(true); - mfSrc->m_fabs_v[f]->copyToMem(cpSrc->l_con.scpy[i].sbx,srccomp,nc,sndPackage->databuf); - } - for(int i=0;il_con.nscpy; i++) - cpSrc->l_con.scpy[i].pQueue.enqueue(cpSrc->l_con.scpy[i].recycleQueue.dequeue(true),true); - pthread_mutex_unlock(&(cpSrc->l_con.sLock)); - } - else - { - if(ntid == 0) - pthread_mutex_lock(&(cpSrc->l_con.sLock)); - srcGraph->worker[tg]->barr->sync(perilla::NUM_THREADS_PER_TEAM-1); - for(int i=0; il_con.nscpy; i++) - if((i%(perilla::NUM_THREADS_PER_TEAM-1)) == ntid) - { - Package* sndPackage = cpSrc->l_con.scpy[i].recycleQueue.getFront(true); - mfSrc->m_fabs_v[f]->copyToMem(cpSrc->l_con.scpy[i].sbx,srccomp,nc,sndPackage->databuf); - } - srcGraph->worker[tg]->barr->sync(perilla::NUM_THREADS_PER_TEAM-1); - if(ntid==0) - { - for(int i=0;il_con.nscpy; i++) - cpSrc->l_con.scpy[i].pQueue.enqueue(cpSrc->l_con.scpy[i].recycleQueue.dequeue(true),true); - pthread_mutex_unlock(&(cpSrc->l_con.sLock)); - } - srcGraph->worker[tg]->barr->sync(perilla::NUM_THREADS_PER_TEAM-1); - } - - int np = ParallelDescriptor::NProcs(); - if(np == 1) - return; - - if(singleT) - { - pthread_mutex_lock(&(cpSrc->r_con.sndLock)); - for(int i=0; ir_con.nsnd; i++) - { - - Package* sndPackage = cpSrc->r_con.snd[i].recycleQueue.dequeue(true); - mfSrc->m_fabs_v[f]->copyToMem(cpSrc->r_con.snd[i].sbx,srccomp,nc,sndPackage->databuf); - cpSrc->r_con.snd[i].pQueue.enqueue(sndPackage,true); - } - - pthread_mutex_unlock(&(cpSrc->r_con.sndLock)); - - cpSrc->r_con.remotePushReady = true; - ///* - pthread_mutex_lock(&(srcGraph->sCopyMapHead->map[f]->r_con.sndLock)); - for(int i=0; ir_con.nsnd; i++) - srcGraph->sCopyMapHead->map[f]->r_con.snd[i].pQueue.enqueue(srcGraph->sCopyMapHead->map[f]->r_con.snd[i].recycleQueue.dequeue(true),true); - pthread_mutex_unlock(&(srcGraph->sCopyMapHead->map[f]->r_con.sndLock)); - } - else - { - if(ntid == 0) - pthread_mutex_lock(&(cpSrc->r_con.sndLock)); - srcGraph->worker[tg]->barr->sync(perilla::NUM_THREADS_PER_TEAM-1); - - for(int i=0; ir_con.nsnd; i++) - if((i%(perilla::NUM_THREADS_PER_TEAM-1)) == ntid) - { - Package* sndPackage = cpSrc->r_con.snd[i].recycleQueue.dequeue(true); - mfSrc->m_fabs_v[f]->copyToMem(cpSrc->r_con.snd[i].sbx,srccomp,nc,sndPackage->databuf); - cpSrc->r_con.snd[i].pQueue.enqueue(sndPackage,true); - } - - srcGraph->worker[tg]->barr->sync(perilla::NUM_THREADS_PER_TEAM-1); - if(ntid==0) - { - pthread_mutex_unlock(&(cpSrc->r_con.sndLock)); - - cpSrc->r_con.remotePushReady = true; - ///* - pthread_mutex_lock(&(srcGraph->sCopyMapHead->map[f]->r_con.sndLock)); - for(int i=0; ir_con.nsnd; i++) - srcGraph->sCopyMapHead->map[f]->r_con.snd[i].pQueue.enqueue(srcGraph->sCopyMapHead->map[f]->r_con.snd[i].recycleQueue.dequeue(true),true); - pthread_mutex_unlock(&(srcGraph->sCopyMapHead->map[f]->r_con.sndLock)); - //*/ - } - srcGraph->worker[tg]->barr->sync(perilla::NUM_THREADS_PER_TEAM-1); - } - } // if(!(*mfDst == *mfSrc)) -} // multifabCopyPushAsync - - -void Perilla::fillBoundaryPush(RegionGraph* graph, MultiFab* mf, int f) -{ - - int nComp = mf->nComp(); - int tg= WorkerThread::perilla_wid(); - int ntid = WorkerThread::perilla_wtid(); - - if(ntid == 0) - pthread_mutex_lock(&(graph->lMap[f]->l_con.sLock)); - graph->worker[tg]->barr->sync(perilla::NUM_THREADS_PER_TEAM-1); // Barrier to synchronize team threads - - for(int i=0; ilMap[f]->l_con.nscpy; i++) - if( (i%(perilla::NUM_THREADS_PER_TEAM-1)) == ntid) - { - Package *sPackage = graph->lMap[f]->l_con.scpy[i].recycleQueue.getFront(true); - 
mf->m_fabs_v[f]->copyToMem(graph->lMap[f]->l_con.scpy[i].sbx,0,nComp,sPackage->databuf); - } - graph->worker[tg]->barr->sync(perilla::NUM_THREADS_PER_TEAM-1); // Barrier to synchronize team threads - - if(ntid==0) - { - for(int i=0; ilMap[f]->l_con.nscpy; i++) - { - graph->lMap[f]->l_con.scpy[i].pQueue.enqueue( graph->lMap[f]->l_con.scpy[i].recycleQueue.dequeue(true),true ); - } - pthread_mutex_unlock(&(graph->lMap[f]->l_con.sLock)); - } - graph->worker[tg]->barr->sync(perilla::NUM_THREADS_PER_TEAM-1); // Barrier to synchronize team threads - - int np = ParallelDescriptor::NProcs(); - if (np==1) return; - - if(ntid==0) - pthread_mutex_lock(&(graph->lMap[f]->r_con.sndLock)); - graph->worker[tg]->barr->sync(perilla::NUM_THREADS_PER_TEAM-1); // Barrier to synchronize team threads - - for(int i=0; ilMap[f]->r_con.nsnd; i++) - if((i%(perilla::NUM_THREADS_PER_TEAM-1))==ntid) - { - Package *sndPackage = graph->lMap[f]->r_con.snd[i].recycleQueue.dequeue(true); - mf->m_fabs_v[f]->copyToMem(graph->lMap[f]->r_con.snd[i].sbx,0,nComp,sndPackage->databuf); - graph->lMap[f]->r_con.snd[i].pQueue.enqueue( sndPackage,true ); - } - graph->worker[tg]->barr->sync(perilla::NUM_THREADS_PER_TEAM-1); // Barrier to synchronize team threads - if(ntid==0) - { - pthread_mutex_unlock(&(graph->lMap[f]->r_con.sndLock)); - pthread_mutex_lock(&(graph->sMap[f]->r_con.sndLock)); - for(int i=0; ilMap[f]->r_con.nsnd; i++) - graph->sMap[f]->r_con.snd[i].pQueue.enqueue( graph->sMap[f]->r_con.snd[i].recycleQueue.dequeue(true),true ); - pthread_mutex_unlock(&(graph->sMap[f]->r_con.sndLock)); - } -} // fillBoundaryPush - - - -void Perilla::fillBoundaryPush(amrex::RGIter& rgi, amrex::MultiFab& mf) -{ - if(rgi.currentItr != rgi.totalItr) - return; - - int f = rgi.currentRegion; - fillBoundaryPush(rgi.itrGraph, &mf, f); -} - -void Perilla::fillBoundaryPush(amrex::RGIter& rgi, RegionGraph* rg, amrex::MultiFab& mf) -{ - if(rgi.currentItr != rgi.totalItr) - return; - - int f = rgi.currentRegion; - fillBoundaryPush(rg, &mf, f); -} - - -void Perilla::multifabCopyPush(RegionGraph* destGraph, RegionGraph* srcGraph, amrex::MultiFab* mfDst, amrex::MultiFab* mfSrc, int f, int dstcomp, int srccomp, int nc, int ng, int ngsrc, bool singleT) -{ - if(nc<1) cout <<"MULTIFAB_COPY_C: nc must be >= 1"<< endl; - if(mfDst->nComp() < (dstcomp-1)) cout <<"MULTIFAB_COPY_C: nc too large for dst multifab"<< endl; - if(mfSrc->nComp() < (srccomp-1)) cout <<"MULTIFAB_COPY_C: nc too large for src multifab"<< endl; - - multifabCopyPush_1Team(destGraph,srcGraph,mfDst,mfSrc,f,dstcomp,srccomp,nc,ng,ngsrc,singleT); -} - - -void Perilla::multifabCopyPush_1Team(RegionGraph* destGraph, RegionGraph* srcGraph, amrex::MultiFab* mfDst, amrex::MultiFab* mfSrc, int f, int dstcomp, int srccomp, int nc, int ng, int ngsrc, bool singleT) -{ - int ntid = perilla::wtid();// - perilla::NUM_COMM_THREADS; - int tg = perilla::wid(); - int myProc = amrex::ParallelDescriptor::MyProc(); - - if(true)//if(!(*mfDst == *mfSrc)) - { - if(ng > mfDst->nGrow()) cout <<"MULTIFAB_COPY_C: ng > 0 not supported in parallel copy"<< endl; - if(ngsrc > mfSrc->nGrow()) cout <<"MULTIFAB_COPY_C: ngsrc > msrc%ng"<< endl; - FabCopyAssoc* cpSrc = srcGraph->task[f]->cpAsc_srcHead; - - while(cpSrc != 0) - { - if(cpSrc->graphPartner == destGraph) - break; - cpSrc = cpSrc->next; - } - if(cpSrc == 0) cout <<"Metadata for across grid copy not found"<< endl; - - if(singleT) - { - pthread_mutex_lock(&(cpSrc->l_con.sLock)); - for(int i=0; il_con.nscpy; i++) - { - Package* sndPackage = 
cpSrc->l_con.scpy[i].recycleQueue.getFront(true); - mfSrc->m_fabs_v[f]->copyToMem(cpSrc->l_con.scpy[i].sbx,srccomp,nc,sndPackage->databuf); - } - for(int i=0;il_con.nscpy; i++) - cpSrc->l_con.scpy[i].pQueue.enqueue(cpSrc->l_con.scpy[i].recycleQueue.dequeue(true)); - pthread_mutex_unlock(&(cpSrc->l_con.sLock)); - } - else - { - if(ntid == 0) - { - pthread_mutex_lock(&(cpSrc->l_con.sLock)); - for(int i=0; il_con.nscpy; i++) - { - Package* sndPackage = cpSrc->l_con.scpy[i].recycleQueue.getFront(true); - mfSrc->m_fabs_v[f]->copyToMem(cpSrc->l_con.scpy[i].sbx,srccomp,nc,sndPackage->databuf); - } - - for(int i=0;il_con.nscpy; i++) - cpSrc->l_con.scpy[i].pQueue.enqueue(cpSrc->l_con.scpy[i].recycleQueue.dequeue(true)); - pthread_mutex_unlock(&(cpSrc->l_con.sLock)); - } - } - - int np = amrex::ParallelDescriptor::NProcs(); - if(np == 1) - return; - if(singleT) - { - pthread_mutex_lock(&(cpSrc->r_con.sndLock)); - for(int i=0; ir_con.nsnd; i++) - { - Package* sndPackage = cpSrc->r_con.snd[i].recycleQueue.dequeue(true); - mfSrc->m_fabs_v[f]->copyToMem(cpSrc->r_con.snd[i].sbx,srccomp,nc,sndPackage->databuf); - sndPackage->served = false; - sndPackage->completed = false; - cpSrc->r_con.snd[i].pQueue.enqueue(sndPackage, true); - } - cpSrc->r_con.remotePushReady = true; - pthread_mutex_unlock(&(cpSrc->r_con.sndLock)); - } - else - { - if(ntid == 0) - { - pthread_mutex_lock(&(cpSrc->r_con.sndLock)); - for(int i=0; ir_con.nsnd; i++) - { - Package* sndPackage = cpSrc->r_con.snd[i].recycleQueue.dequeue(true); - mfSrc->m_fabs_v[f]->copyToMem(cpSrc->r_con.snd[i].sbx,srccomp,nc,sndPackage->databuf); - sndPackage->served = false; - sndPackage->completed = false; - cpSrc->r_con.snd[i].pQueue.enqueue(sndPackage, true); - } - cpSrc->r_con.remotePushReady = true; - pthread_mutex_unlock(&(cpSrc->r_con.sndLock)); - } - } - } // if(!(*mfDst == *mfSrc)) -} // multifabCopyPush - - -void Perilla::serviceLocalGridCopyRequests(std::vector graphArray, int g, int tg) -{ - int nfabs = graphArray[g]->numTasks; - - for(int f=0; ftask[f]->cpAsc_srcHead; - while(cpSrc != 0) - { - bool anyReq=false; - for(int i=0; il_con.nscpy; i++) - if(cpSrc->l_con.scpy[i].pQueue.queueSize(true)>0){ - anyReq=true; - break; - } - if(anyReq) - { - pthread_mutex_lock(&(cpSrc->l_con.sLock)); - for(int i=0; il_con.nscpy; i++) - { - if(cpSrc->l_con.scpy[i].pQueue.queueSize(true)>0) - { - FabCopyAssoc* cpDst = cpSrc->graphPartner->task[cpSrc->l_con.scpy[i].nd]->cpAsc_dstHead; - while(cpDst != 0) - { - if(cpDst->graphPartner == graphArray[g]) - break; - cpDst = cpDst->next; - } - Package* sPackage = cpSrc->l_con.scpy[i].pQueue.dequeue(true); - pthread_mutex_lock(&(cpDst->l_con.dLock)); - int dPartner = cpSrc->l_con.scpy[i].dPartner; - Package* dPackage = cpDst->l_con.dcpy[dPartner].recycleQueue.dequeue(true); - std::memcpy(dPackage->databuf, sPackage->databuf, dPackage->bufSize * sizeof(double)); - cpDst->l_con.dcpy[dPartner].pQueue.enqueue(dPackage,true); - if(cpDst->l_con.dcpy[dPartner].pQueue.queueSize(true) == 1) - cpDst->l_con.firingRuleCnt++; - pthread_mutex_unlock(&(cpDst->l_con.dLock)); - cpSrc->l_con.scpy[i].recycleQueue.enqueue(sPackage,true); - } - } // for - pthread_mutex_unlock(&(cpSrc->l_con.sLock)); - }//anyReq - cpSrc = cpSrc->next; - } // while(cpSrc != 0) - } // if(tg==fg) - } // for(f graphArray, int g, int nGraphs, int tg) -{ - bool nextsReq, nextrReq; - int np = ParallelDescriptor::NProcs(); - int myProc = ParallelDescriptor::MyProc(); - int numfabs = graphArray[g]->numTasks; - int graphID = graphArray[g]->graphID; - -#ifdef 
PERILLA_DEBUG - double time= -getTime(); -#endif - for(int f=0; ftask[f]->cpAsc_dstHead; - while(cpDst != 0) - { - for(int i=0; ir_con.nrcv; i++) - { - if(cpDst->r_con.rcv[i].pQueue.queueSize(true)==0) - { - nextrReq = true; - } - else - { - Package *rearPackage = cpDst->r_con.rcv[i].pQueue.getRear(true); - if(rearPackage) - if(rearPackage->completed && cpDst->r_con.rcv[i].pQueue.queueSize(true) == 1) //!latest receive request has been completed - { - nextrReq = true; - } - else //!expected message is still on the way - nextrReq = false; - } - if(nextrReq) //!take a message from recycle pool and post a receive - { - pthread_mutex_lock(&(cpDst->r_con.rcvLock)); - int ns = graphArray[g]->rCopyMapHead->map[f]->r_con.rcv[i].ns; - int nd = graphArray[g]->rCopyMapHead->map[f]->r_con.rcv[i].nd; - int lnd = graphArray[g]->rCopyMapHead->map[f]->r_con.rcv[i].lnd; - int r_grids = graphArray[g]->rCopyMapHead->map[f]->r_con.rcv[i].r_grids; - Package *rPackage = cpDst->r_con.rcv[i].recycleQueue.dequeue(true); - int tag = tagMap[graphArray[g]->rCopyMapHead->map[f]->r_con.rcv[i].pr][g][nd][ns][graphArray[g]->rCopyMapHead->map[f]->r_con.rcv[i].sz]; - rPackage->request = MPI_REQUEST_NULL; - rPackage->completed=false; - cpDst->r_con.rcv[i].pQueue.enqueue(rPackage, true); //!this is not done yet - rPackage->request = ParallelDescriptor::Arecv(rPackage->databuf, - graphArray[g]->rCopyMapHead->map[f]->r_con.rcv[i].sz, - graphArray[g]->rCopyMapHead->map[f]->r_con.rcv[i].pr, tag).req(); // tag == SeqNum in c++ ver - pthread_mutex_unlock(&(cpDst->r_con.rcvLock)); - } - } // for (ir_con.nrcv) - cpDst = cpDst->next; - } // while(cpDst != 0) - } // for(ftask[f]->cpAsc_srcHead; - while(cpSrc != 0) - { - for(int i=0; ir_con.nsnd; i++) - { - if(cpSrc->r_con.snd[i].pQueue.queueSize(true) == 0) - nextsReq = false; - else - nextsReq = true; - - if(nextsReq) - { - //there is no need to lock the queue because we only touch the front to initialize the send - //During this time, workers can produce more messages into the queue, but a circular queue ensures that the front of the queue will not be modified - Package *sPackage = cpSrc->r_con.snd[i].pQueue.getFront(true); - if(!sPackage->served) - { - sPackage->completed = false; - sPackage->served = true; - sPackage->request = MPI_REQUEST_NULL; - int ns = graphArray[g]->sCopyMapHead->map[f]->r_con.snd[i].ns; - int nd = graphArray[g]->sCopyMapHead->map[f]->r_con.snd[i].nd; - int r_gid = graphArray[g]->sCopyMapHead->map[f]->r_con.snd[i].r_gid; - int r_grids = graphArray[g]->sCopyMapHead->map[f]->r_con.snd[i].r_grids; - int tag = Perilla::myTagMap[r_gid][nd][ns][graphArray[g]->sCopyMapHead->map[f]->r_con.snd[i].sz]; - sPackage->request = ParallelDescriptor::Asend(sPackage->databuf, - graphArray[g]->sCopyMapHead->map[f]->r_con.snd[i].sz, - graphArray[g]->sCopyMapHead->map[f]->r_con.snd[i].pr, tag).req(); // tag == SeqNum in c++ ver - } - } - } // for (ir_con.nsnd) - cpSrc = cpSrc->next; - } // while(cpSrc != 0) - } // for(ftask[f]->cpAsc_dstHead; - while(cpDst != 0) - { - for(int i=0; ir_con.nrcv; i++) - { - if(cpDst->r_con.rcv[i].pQueue.queueSize(true) > 0) - { - Package *rearPackage = cpDst->r_con.rcv[i].pQueue.getRear(true); - //Note: all messages before rear have completed - if(rearPackage) - if(!rearPackage->completed) - { - bool flag = false; - int ret_flag=0; - MPI_Status status; - ParallelDescriptor::Test(rearPackage->request, ret_flag, status); - - flag = (ret_flag == 0) ? 
false : true; - if(flag) - { - pthread_mutex_lock(&(cpDst->r_con.rcvLock)); - rearPackage->completeRequest(true); - if(cpDst->r_con.rcv[i].pQueue.queueSize(true) == 1) - { - cpDst->r_con.firingRuleCnt++; - } - pthread_mutex_unlock(&(cpDst->r_con.rcvLock)); - } - } - } // if(pQueue.queueSize(true) > 0) - } // for (ir_con.nrcv) - cpDst = cpDst->next; - } // while(cpDst != 0) - } // for(ftask[f]->cpAsc_srcHead; - while(cpSrc != 0) - { - for(int i=0; ir_con.nsnd; i++) - { - if(cpSrc->r_con.snd[i].pQueue.queueSize(true) >0) - { - Package *frontPackage = cpSrc->r_con.snd[i].pQueue.getFront(true); - if(frontPackage->served) - { - bool flag = false; - int ret_flag; - MPI_Status status; - ParallelDescriptor::Test(frontPackage->request, ret_flag, status); - flag = (ret_flag == 0) ? false : true; - if(flag) - { - //we have to lock the queue before removing the front - pthread_mutex_lock(&(cpSrc->r_con.sndLock)); - frontPackage = cpSrc->r_con.snd[i].pQueue.dequeue(true); - frontPackage->completed = false; - frontPackage->served = false; - frontPackage->request = MPI_REQUEST_NULL; - cpSrc->r_con.snd[i].recycleQueue.enqueue(frontPackage, true); - pthread_mutex_unlock(&(cpSrc->r_con.sndLock)); - } - } - } // if(queueSize > 0) - } // for (ir_con.nsnd) - cpSrc = cpSrc->next; - } // while(cpSrc != 0) - } // for(f -#include -#include - -namespace perilla{ - -struct _workerThreadInfo{ - int _tid; //thread id in local group - int _size; //number of threads in the group -}; - -struct _threadInfo{ - bool _isComm; //whether this thread handles communication - int _wtid; //worker thread id (-1 if this thread is decicated to communication) - int _nWts; //number of thread groups -}; - -class RTS -{ - private: - int _nWrks; - void RTS_Init(); - int _rank, _nProcs; - - public: - RTS(){ - _nWrks=1; - char* nWrks= getenv("NWORKERS"); - if(nWrks) _nWrks= atoi(nWrks); - } - RTS(int nWrks):_nWrks(nWrks){} - int ProcCount(); - int MyProc(); - int WorkerThreadCount(); - int MyWorkerThread(); - void Init(); //Build the runtime system from scratch - void Init(int rank, int nProcs);//Build the runtime system on pre-existing MPI processes - void Iterate(void *graph, int max_step, Real stop_time); - void Finalize(); - void Barrier(); - void runAMR(Amr* amrptr, int max_step, Real stop_time); - void invokeOnDemand(std::vector rg, RGIter *rgi); -}; - -} -#endif diff --git a/Src/AmrTask/rts_impls/mpi/PerillaRts.cpp b/Src/AmrTask/rts_impls/mpi/PerillaRts.cpp deleted file mode 100644 index f101bd5e4b0..00000000000 --- a/Src/AmrTask/rts_impls/mpi/PerillaRts.cpp +++ /dev/null @@ -1,195 +0,0 @@ -//Question? 
email tannguyen@lbl.gov -//Created 07-19-2017 -//Last modification 08-14-2017 -#include -#include -#include -#include -#include -#include -#include "PerillaRts.H" - -using namespace perilla; -#ifdef PERILLA_DEBUG -#include -PerillaMemCheck memcheck; -#endif - -#include -#include -using namespace std; -#include - -namespace perilla{ - Amr* amrptr; - struct RtsDomain{ - pthread_t *_threads; - int _size; - MyLock _lock; - RtsDomain():_threads(NULL), _size(0){}; - ~RtsDomain(){ - free(_threads); - } - }; - int numa_nodes; - RtsDomain *dom; - MyLock _l; - volatile char startSignal=0; - pthread_mutex_t startLock= PTHREAD_MUTEX_INITIALIZER; - - int RTS::ProcCount(){ - return _nProcs; - } - - int RTS::MyProc(){ - return _rank; - } - - int RTS::WorkerThreadCount(){ - return _nWrks; - } - - int RTS::MyWorkerThread(){ - return 0; - } - - struct argT { - int numaID; - int tid; - int g_tid; - int nThreads; - int nTotalThreads; - int max_step; - Real stop_time; - RTS* thisRTS; - }; - - void RTS::runAMR(Amr* amr, int max_step, Real stop_time){ - while (amr->okToContinue() && - (amr->levelSteps(0) < max_step || max_step < 0) && - (amr->cumTime() < stop_time || stop_time < 0.0) ) - - { - // Do a coarse timestep, which calls one or multiple timestep updates (i.e. timeStep()) at each AMR level - amr->coarseTimeStep(stop_time); - } - } - -#ifdef USE_PERILLA_PTHREADS - void run(void* threadInfo){ - argT *args= (argT*)threadInfo; - int numaID= args->numaID; - int tid= args->tid; - int g_tid= args->g_tid; - int nThreads= args->nThreads; - int nTotalThreads= args->nTotalThreads; - int max_step= args->max_step; - Real stop_time= args->stop_time; - RTS* rts= args->thisRTS; - Perilla::registerId(g_tid); - //done with thread id setup, now wait for the start signal from master - pthread_mutex_lock(&startLock); - startSignal++; - pthread_mutex_unlock(&startLock); - while(startSignal!= nTotalThreads){} - rts->runAMR(amrptr, max_step, stop_time); - } -#endif - - void InitializeMPI(){ - int provided; - MPI_Init_thread(0, 0, MPI_THREAD_FUNNELED, &provided); - if(provided == MPI_THREAD_SINGLE){//with this MPI, process can't spawn threads - cerr << "Spawning threads is not allowed by the MPI implementation" << std::endl;; - } - } - - void RTS::RTS_Init(){ - amrptr= NULL; - } - - void RTS::Init(){ - InitializeMPI(); - MPI_Comm_rank(MPI_COMM_WORLD, &_rank); - MPI_Comm_size(MPI_COMM_WORLD, &_nProcs); - RTS_Init(); - } - - void RTS::Init(int rank, int nProcs){ - _rank= rank; - _nProcs= nProcs; - RTS_Init(); - } - - void RTS::Finalize(){ -#ifdef PERILLA_DEBUG - memcheck.report(); -#endif - } - - void RTS::Iterate(void* amrGraph, int max_step, Real stop_time){ - assert(amrGraph); - Perilla::max_step= max_step; - amrptr= (Amr*)amrGraph; - WorkerThread::init(); -#ifndef USE_PERILLA_PTHREADS - runAMR(amrptr, max_step, stop_time); -#else - int numa_nodes= perilla::NUM_THREAD_TEAMS; - int worker_per_numa = perilla::NUM_THREADS_PER_TEAM; - int _nWrks= numa_nodes*worker_per_numa; - int base=0; - int localID=-1; - //create a list of persistent threads for each NUMA node - cpu_set_t cpuset; - pthread_attr_t attr; - pthread_attr_init(&attr); - dom= new RtsDomain[numa_nodes]; - for(int i=0; inumaID= domNo; - arg->tid= localID; - arg->g_tid= domNo*worker_per_numa+localID; - arg->nThreads= worker_per_numa; - arg->nTotalThreads= _nWrks; - arg->thisRTS= this; - arg->max_step= max_step; - arg->stop_time= stop_time; - int err = pthread_create(&(dom[domNo]._threads[localID]), &attr, (void*(*)(void*))run, arg); - }else{ //master thread - 
dom[domNo]._threads[localID]= pthread_self(); - Perilla::registerId(0); - //enable worker threads to start computing - pthread_mutex_lock(&startLock); - startSignal++; - pthread_mutex_unlock(&startLock); - } - dom[domNo]._size++; - if(localID == (worker_per_numa-1)){ - localID=-1; - base+= worker_per_numa; - } - } - while(startSignal!= _nWrks){}//wait until all threads have done the setup phase - runAMR(amrptr, max_step, stop_time); - for(int i=1; i<_nWrks; i++) pthread_join(dom[i/worker_per_numa]._threads[i%worker_per_numa], NULL); -#endif - } - - void RTS::Barrier(){ - MPI_Barrier(MPI_COMM_WORLD); - } - -}//end namespace - diff --git a/Src/AmrTask/rts_impls/mpi/perilla.mak b/Src/AmrTask/rts_impls/mpi/perilla.mak deleted file mode 100755 index 9e1c88ce260..00000000000 --- a/Src/AmrTask/rts_impls/mpi/perilla.mak +++ /dev/null @@ -1,10 +0,0 @@ -CEXE_sources += PackageQueue.cpp -CEXE_sources += Perilla.cpp -CEXE_sources += WorkerThread.cpp - - -CEXE_headers += Config.H -CEXE_headers += PackageQueue.H - - - diff --git a/Src/AmrTask/rts_impls/mpi_omp/AsyncMultiFabUtil.H b/Src/AmrTask/rts_impls/mpi_omp/AsyncMultiFabUtil.H deleted file mode 100755 index 66c239f0f2f..00000000000 --- a/Src/AmrTask/rts_impls/mpi_omp/AsyncMultiFabUtil.H +++ /dev/null @@ -1,34 +0,0 @@ -#ifndef _AsyncMultiFabUtil_H_ -#define _AsyncMultiFabUtil_H_ - -#include -#include -#include -#include - -void average_down_push(Amr& amr, MultiFab& S_fine, MultiFab& S_crse, MultiFab& crse_S_fine, RegionGraph* RG_fine, RegionGraph* RG_crse, const Geometry& fine_geom, const Geometry& crse_geom, int scomp, int ncomp, const IntVect& ratio, int f); - -void average_down_pull(MultiFab& S_fine, MultiFab& S_crse, RegionGraph* RG_fine, RegionGraph* RG_crse, const Geometry& fine_geom, const Geometry& crse_geom, int scomp, int ncomp, const IntVect& ratio, int f); - -void average_down_push(Amr& amr, MultiFab& S_fine, MultiFab& S_crse, MultiFab& crse_S_fine, RegionGraph* RG_fine, RegionGraph* RG_crse, const Geometry& fine_geom, const Geometry& crse_geom, int scomp, int ncomp, const int ratio, int f); - -void average_down_pull(MultiFab& S_fine, MultiFab& S_crse, RegionGraph* RG_fine, RegionGraph* RG_crse, const Geometry& fine_geom, const Geometry& crse_geom, int scomp, int ncomp, const int ratio, int f); - -// Average fine cell-based MultiFab onto crse cell-centered MultiFab without volume weighting. -// This routine DOES NOT assume that the crse BoxArray is a coarsened version of the fine BoxArray. 
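-// The push/pull average_down variants below split the restriction into a local
-// averaging kernel plus an asynchronous graph copy. A self-contained sketch of
-// the averaging arithmetic itself (flat 2-D arrays stand in for FArrayBox data;
-// the real kernel is amrex_avgdown over a tilebox):
-//
-//   // Average each ratio x ratio block of fine cells into one coarse cell.
-//   void avgdown2d(const double* fine, int fnx, int fny, double* crse, int ratio)
-//   {
-//       int cnx = fnx / ratio;
-//       double vinv = 1.0 / (ratio * ratio);
-//       for (int c = 0; c < cnx * (fny / ratio); ++c) crse[c] = 0.0;
-//       for (int j = 0; j < fny; ++j)
-//           for (int i = 0; i < fnx; ++i)
-//               crse[(j / ratio) * cnx + (i / ratio)] += vinv * fine[j * fnx + i];
-//   }
-//
-// Averaging a constant field returns the same constant, which is a quick sanity
-// check on the weighting.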
- -void average_down_push(Amr& amr, MultiFab& S_fine, MultiFab& S_crse, MultiFab& crse_S_fine, RegionGraph* RG_fine, RegionGraph* RG_crse, int scomp, int ncomp, const IntVect& ratio, int f); - -void average_down_pull(MultiFab& S_fine, MultiFab& S_crse, RegionGraph* RG_fine, RegionGraph* RG_crse, int scomp, int ncomp, const IntVect& ratio, int f); - -void average_down_push(Amr& amr, MultiFab& S_fine, MultiFab& S_crse, MultiFab& crse_S_fine, RegionGraph* RG_fine, RegionGraph* RG_crse, int scomp, int ncomp, int ratio, int f); - -void average_down_pull(MultiFab& S_fine, MultiFab& S_crse, RegionGraph* RG_fine, RegionGraph* RG_crse, int scomp, int ncomp, int ratio, int f); - -void average_down_push (RGIter& rgi, MultiFab* S_fine, MultiFab* S_crse, MultiFab* crse_S_fine, RegionGraph* RG_fine, RegionGraph* RG_crse, - amrex::Geometry&, amrex::Geometry&,int scomp, int ncomp, const IntVect& ratio, int f); - -void average_down_pull (RGIter& rgi, MultiFab* S_fine, MultiFab* S_crse, RegionGraph* RG_fine, RegionGraph* RG_crse, - amrex::Geometry&, amrex::Geometry&, int scomp, int ncomp, const IntVect& ratio, int f); - -#endif diff --git a/Src/AmrTask/rts_impls/mpi_omp/AsyncMultiFabUtil.cpp b/Src/AmrTask/rts_impls/mpi_omp/AsyncMultiFabUtil.cpp deleted file mode 100755 index e86ff112537..00000000000 --- a/Src/AmrTask/rts_impls/mpi_omp/AsyncMultiFabUtil.cpp +++ /dev/null @@ -1,175 +0,0 @@ -#include -//#include -#include -#include -#include -#include - -using namespace amrex; -using namespace perilla; - -void average_down_push (Amr& amr, MultiFab& S_fine, MultiFab& S_crse, MultiFab& crse_S_fine, RegionGraph* RG_fine, RegionGraph* RG_crse, - const Geometry& fgeom, const Geometry& cgeom, int scomp, int ncomp, int rr, int f) -{ - average_down_push(amr,S_fine,S_crse,crse_S_fine,RG_fine,RG_crse,fgeom,cgeom,scomp,ncomp,rr*IntVect::TheUnitVector(),f); -} - -void average_down_pull (MultiFab& S_fine, MultiFab& S_crse, RegionGraph* RG_fine, RegionGraph* RG_crse, -const Geometry& fgeom, const Geometry& cgeom, int scomp, int ncomp, int rr, int f) -{ - average_down_pull(S_fine,S_crse,RG_fine,RG_crse,fgeom,cgeom,scomp,ncomp,rr*IntVect::TheUnitVector(),f); -} - -void average_down_push (Amr& amr, MultiFab& S_fine, MultiFab& S_crse, MultiFab& crse_S_fine, RegionGraph* RG_fine, RegionGraph* RG_crse, - const Geometry& fgeom, const Geometry& cgeom, int scomp, int ncomp, const IntVect& ratio, int f) -{ - if (S_fine.is_nodal() || S_crse.is_nodal()) - { - amrex::Error("Can't use amrex::average_down for nodal MultiFab!"); - } - -#if (BL_SPACEDIM == 3) - average_down_push(amr, S_fine, S_crse, crse_S_fine, RG_fine, RG_crse, scomp, ncomp, ratio, f); - return; -#else - - assert(S_crse.nComp() == S_fine.nComp()); - - - MultiFab fvolume; - fgeom.GetVolume(fvolume, fine_BA, 0); - - int lfi = crse_S_fine.IndexArray()[f]; - const Box& tbx = crse_S_fine[ lfi ].box(); - - amrex_avgdown_with_vol(tbx,crse_S_fine[lfi].array(),S_fine[lfi].array(),fvolume[mfi].array(), - 0,scomp,ncomp,ratio); - - Perilla::multifabCopyPushAsync(RG_crse, RG_fine, &S_crse, &crse_S_fine, f, scomp, 0, ncomp, 0, 0, false); -#endif -} - -void average_down_pull (MultiFab& S_fine, MultiFab& S_crse, RegionGraph* RG_fine, RegionGraph* RG_crse, const Geometry& fgeom, const Geometry& cgeom, - int scomp, int ncomp, const IntVect& ratio, int f) -{ - - if (S_fine.is_nodal() || S_crse.is_nodal()) - { - amrex::Error("Can't use amrex::average_down for nodal MultiFab!"); - } - -#if (BL_SPACEDIM == 3) - average_down_pull(S_fine, S_crse, RG_fine, RG_crse, scomp, ncomp, ratio, f); - 
return; -#else - assert(S_crse.nComp() == S_fine.nComp()); - Perilla::multifabCopyPull(RG_crse, RG_fine, &S_crse, &S_fine, f, scomp, 0, ncomp, 0, 0, false); -#endif -} - - -// ************************************************************************************************************* - -void average_down_push (Amr& amr, MultiFab& S_fine, MultiFab& S_crse, MultiFab& crse_S_fine, RegionGraph* RG_fine, RegionGraph* RG_crse, - int scomp, int ncomp, int rr, int f) -{ - average_down_push(amr,S_fine,S_crse,crse_S_fine,RG_fine,RG_crse,scomp,ncomp,rr*IntVect::TheUnitVector(),f); -} -void average_down_pull (MultiFab& S_fine, MultiFab& S_crse, RegionGraph* RG_fine, RegionGraph* RG_crse, int scomp, int ncomp, int rr, int f) -{ - average_down_pull(S_fine,S_crse,RG_fine,RG_crse,scomp,ncomp,rr*IntVect::TheUnitVector(),f); -} - -void average_down_push (Amr& amr, MultiFab& S_fine, MultiFab& S_crse, MultiFab& crse_S_fine, RegionGraph* RG_fine, RegionGraph* RG_crse, - int scomp, int ncomp, const IntVect& ratio, int f) -{ - assert(S_crse.nComp() == S_fine.nComp()); - - // NOTE: The tilebox is defined at the coarse level. - int lfi = crse_S_fine.IndexArray()[f]; - int tg = WorkerThread::perilla_wid(); - int nt = WorkerThread::perilla_wtid(); - - for(int t=0; tfabTiles[f]->numTiles; t++) - if(t % (perilla::NUM_THREADS_PER_TEAM-1) == nt) - { - const Box& tbx = *(RG_fine->fabTiles[f]->tileBx[t]); - amrex_avgdown(tbx,crse_S_fine[lfi].array(),S_fine[lfi].array(),0,scomp,ncomp,ratio); - } - RG_fine->worker[tg]->barr->sync(perilla::NUM_THREADS_PER_TEAM-1); // Barrier to synchronize team threads - Perilla::multifabCopyPushAsync(RG_crse, RG_fine, &S_crse, &crse_S_fine, f, scomp, 0, ncomp, 0, 0, false); -} - -void average_down_pull (MultiFab& S_fine, MultiFab& S_crse, RegionGraph* RG_fine, RegionGraph* RG_crse, - int scomp, int ncomp, const IntVect& ratio, int f) -{ - assert(S_crse.nComp() == S_fine.nComp()); - Perilla::multifabCopyPull(RG_crse, RG_fine, &S_crse, &S_fine, f, scomp, 0, ncomp, 0, 0, false); -} - -void average_down_push (RGIter& rgi, MultiFab* S_fine, MultiFab* S_crse, MultiFab* crse_S_fine, RegionGraph* RG_fine, RegionGraph* RG_crse,amrex::Geometry& geom, amrex::Geometry& geom1, - int scomp, int ncomp, const IntVect& ratio, int f) -{ - if(rgi.currentItr != rgi.totalItr) - return; - - f = rgi.currentRegion; - // NOTE: The tilebox is defined at the coarse level. - int lfi = crse_S_fine->IndexArray()[f]; - - // NOTE: We copy from component scomp of the fine fab into component 0 of the crse fab - // because the crse fab is a temporary which was made starting at comp 0, it is - // not part of the actual crse multifab which came in. 
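-    // Hence srccomp = 0 in the multifabCopyPush call below: crse_S_fine is a
-    // scratch MultiFab whose data starts at component 0, and S_crse receives it
-    // back at component scomp.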
- - perilla::syncWorkerThreads(); - int nThreads= perilla::nWorkerThreads(); - for(int t=0; tfabTiles[f]->numTiles; t+= nThreads) - { - const Box& tbx = *(RG_fine->fabTiles[f]->tileBx[t]); - amrex_avgdown(tbx,(*crse_S_fine)[lfi].array(),(*S_fine)[lfi].array(),0,scomp,ncomp,ratio); - } - perilla::syncWorkerThreads(); - Perilla::multifabCopyPush(RG_crse, RG_fine, S_crse, crse_S_fine, f, scomp, 0, ncomp, 0, 0, false); -} - -void average_down_pull (RGIter& rgi, MultiFab* S_fine, MultiFab* S_crse, RegionGraph* RG_fine, RegionGraph* RG_crse, amrex::Geometry& geom, amrex::Geometry& geom1, - int scomp, int ncomp, const IntVect& ratio, int f) -{ - if(rgi.currentItr != 1) - return; - f = rgi.currentRegion; - - Perilla::multifabCopyPull(RG_crse, RG_fine, S_crse, S_fine, f, scomp, 0, ncomp, 0, 0, false); -} - - -// ************************************************************************************************************* - -#if 0 -// Average fine face-based MultiFab onto crse fine-centered MultiFab. -// This routine assumes that the crse BoxArray is a coarsened version of the fine BoxArray. -void average_down_faces (PArray& fine, PArray& crse, IntVect& ratio) -{ - BL_ASSERT(crse.size() == BL_SPACEDIM); - BL_ASSERT(fine.size() == BL_SPACEDIM); - BL_ASSERT(crse[0].nComp() == fine[0].nComp()); - - int ncomp = crse[0].nComp(); - -#ifdef _OPENMP -#pragma omp parallel -#endif - for (int n=0; n - -class Barrier -{ -private: - volatile int counter; - int maxThreads; - volatile bool globalSense; -public: - Barrier(); - Barrier(int maxThreads); - void init(int maxThreads); - void sync(); - void sync(int numthreads); -}; -#endif diff --git a/Src/AmrTask/rts_impls/mpi_omp/Barrier.cpp b/Src/AmrTask/rts_impls/mpi_omp/Barrier.cpp deleted file mode 100755 index 5409a7e43c1..00000000000 --- a/Src/AmrTask/rts_impls/mpi_omp/Barrier.cpp +++ /dev/null @@ -1,77 +0,0 @@ -#include -#include -#include -#include - -Barrier::Barrier() -{ - //With this intializer, numthreads has to be specified when syncing, i.e. 
sync(numthreads) - counter = INT_MAX; - globalSense = false; - maxThreads=INT_MAX; -} - -Barrier::Barrier(int numthreads) -{ -//With this initializer, both sync() and sync(numthreads) can be used -#pragma omp critical -{ - counter = numthreads; - maxThreads= numthreads; - globalSense = false; -} -} - -void Barrier::init(int numthreads) -{ -//Similar to Barrier(int numthreads) - counter = numthreads; - maxThreads= numthreads; - globalSense = false; -} - -void Barrier::sync() //sync all threads associated with this barrier -{ - assert(maxThreads -#include -#include -#include - -using namespace perilla; -#ifdef PERILLA_DEBUG -#include "PerillaMemCheck.H" -extern PerillaMemCheck memcheck; -#endif -using namespace amrex; - -class LocalCopyDescriptor -{ - public: - int ns; //Source box in layout - int nd; //Destination box in layout - int sz; - Box sbx; //Sub-box for this copy - Box dbx; //Sub-box for this copy - PackageQueue pQueue; //store incoming or outgoing messages, both fab and the runtime can access this queue - PackageQueue recycleQueue; //just for now, I'll replace this with a NUMA aware package allocator - int sPartner, dPartner; - int dcpyCnt,scpyCnt; - omp_lock_t ghostLock; - LocalCopyDescriptor() : ns(-1), nd(-1), scpyCnt(0), dcpyCnt(0), sz(0), sPartner(-1), dPartner(-1) { - omp_init_lock(&ghostLock); - } -}; - -class LocalConnection -{ - public: - int nscpy; //Number of cpy chunks - int ndcpy; //Number of cpy chunks - omp_lock_t sLock, dLock, ghostLock; - int firingRuleCnt; - int scpyCnt, dcpyCnt; - Barrier *localBarrier; - LocalCopyDescriptor *scpy; - LocalCopyDescriptor *dcpy; - LocalConnection() : nscpy(0), ndcpy(0), firingRuleCnt(0), scpy(NULL), dcpy(NULL), scpyCnt(0), dcpyCnt(0), localBarrier(NULL){ - omp_init_lock(&sLock); - omp_init_lock(&dLock); - omp_init_lock(&ghostLock); - } - - ~LocalConnection() - { - if(localBarrier) free(localBarrier); - if(scpy) free(scpy); - if(dcpy) free(dcpy); - } -}; -#endif diff --git a/Src/AmrTask/rts_impls/mpi_omp/Make.package b/Src/AmrTask/rts_impls/mpi_omp/Make.package deleted file mode 100644 index a9cf8caa34d..00000000000 --- a/Src/AmrTask/rts_impls/mpi_omp/Make.package +++ /dev/null @@ -1,11 +0,0 @@ -PERILLA_LIB=EXE - -C$(PERILLA_LIB)_sources += Barrier.cpp RGIter.cpp RegionQueue.cpp PackageQueue.cpp Perilla.cpp RegionGraph.cpp WorkerThread.cpp AsyncMultiFabUtil.cpp PerillaRts.cpp - -C$(PERILLA_LIB)_headers += Barrier.H Config.H LocalConnection.H PackageQueue.H RegionGraph.H RegionQueue.H RemoteConnection.H WorkerThread.H AsyncMultiFabUtil.H PerillaRts.H - -include $(AMREX_HOME)/Src/AmrTask/rts_impls/mpi_omp/perilla.mak -VPATH_LOCATIONS += $(AMREX_HOME)/Src/AmrTask/rts_impls/mpi_omp -INCLUDE_LOCATIONS += $(AMREX_HOME)/Src/AmrTask/rts_impls/mpi_omp - - diff --git a/Src/AmrTask/rts_impls/mpi_omp/PackageQueue.H b/Src/AmrTask/rts_impls/mpi_omp/PackageQueue.H deleted file mode 100755 index d521a4eff25..00000000000 --- a/Src/AmrTask/rts_impls/mpi_omp/PackageQueue.H +++ /dev/null @@ -1,57 +0,0 @@ -#ifndef P_PACKAGEQUEUE_H -#define P_PACKAGEQUEUE_H - -#include -#include -#include - -class Package -{ -private: - int source, destination; -public: - double *databuf; - int bufSize; - omp_lock_t packageLock; - bool completed; //message transfer is done - bool served; //message transfer request has been served but may have not completed - bool notified; - MPI_Request request; //!for MPI - Package(); - ~Package(); - Package(int size); - Package(int src, int dest); - Package(int src, int dest, int size); - void setPackageSource(int src); - void 
setPackageDestination(int dest); - void completeRequest(void); - void completeRequest(bool lockIgnore); - bool checkRequest(void); - void generatePackage(int size); -}; - -class PackageQueue -{ -private: - Package *buffer[perilla::MSG_QUEUE_DEFAULT_MAXSIZE]; - int n; - int front; - int rear; - int prear; -public: - omp_lock_t queueLock; - PackageQueue(); - ~PackageQueue(); - int queueSize(void); - int queueSize(bool lockIgnore); - void enqueue(Package* package); - void enqueue(Package* package, bool lockIgnore); - Package* dequeue(void); - Package* dequeue(bool lockIgnore); - Package* getRear(void); - Package* getRear(bool lockIgnore); - Package* getFront(void); - Package* getFront(bool lockIgnore); - void emptyQueue(); -}; -#endif diff --git a/Src/AmrTask/rts_impls/mpi_omp/PackageQueue.cpp b/Src/AmrTask/rts_impls/mpi_omp/PackageQueue.cpp deleted file mode 100755 index 83009415007..00000000000 --- a/Src/AmrTask/rts_impls/mpi_omp/PackageQueue.cpp +++ /dev/null @@ -1,240 +0,0 @@ -#include -#include -using namespace perilla; -#ifdef PERILLA_DEBUG -#include -extern PerillaMemCheck memcheck; -#endif - -Package::Package() -{ - databuf = 0; - bufSize = 0; - source = 0; - destination = 0; - completed = false; - notified = false; - served = false; - request = MPI_REQUEST_NULL; - omp_init_lock(&packageLock); -#ifdef PERILLA_DEBUG - memcheck.add(memcheck.genKey(this), (void*)this, "Package"); -#endif -} - -Package::~Package() -{ - if(databuf) free(databuf); -#ifdef PERILLA_DEBUG - memcheck.remove(memcheck.genKey(this)); -#endif -} - -Package::Package(int size) -{ - databuf = new double[size]; - bufSize = size; - source = 0; - destination = 0; - completed = false; - notified = false; - served = false; - request = MPI_REQUEST_NULL; - omp_init_lock(&packageLock); -#ifdef PERILLA_DEBUG - memcheck.add(memcheck.genKey(this), (void*)this, "Package"); -#endif -} - -Package::Package(int src, int dest) -{ - bufSize = 0; - source = src; - destination = dest; -#ifdef PERILLA_DEBUG - memcheck.add(memcheck.genKey(this), (void*)this, "Package"); -#endif -} - -Package::Package(int src, int dest, int size) -{ - source = src; - destination = dest; - databuf = new double[size]; - bufSize = size; - source = 0; - destination = 0; - completed = false; - notified = false; - served = false; - request = MPI_REQUEST_NULL; - omp_init_lock(&packageLock); -#ifdef PERILLA_DEBUG - memcheck.add(memcheck.genKey(this), (void*)this, "Package"); -#endif -} - -void Package::setPackageSource(int src) -{ - source = src; -} - -void Package::setPackageDestination(int dest) -{ - destination = dest; -} - -void Package::completeRequest(void) -{ - omp_set_lock(&packageLock); - completed = true; - omp_unset_lock(&packageLock); -} - -void Package::completeRequest(bool lockIgnore) -{ - if(!lockIgnore)omp_set_lock(&packageLock); - completed = true; - if(!lockIgnore)omp_unset_lock(&packageLock); -} - -bool Package::checkRequest(void) -{ - return completed; -} - -void Package::generatePackage(int size) -{ - databuf = new double[size]; - bufSize = size; - source = 0; - destination = 0; - completed = false; - notified = false; - served = false; - request = MPI_REQUEST_NULL; - omp_init_lock(&packageLock); -#ifdef PERILLA_DEBUG - memcheck.add(memcheck.genKey(this), (void*)this, "Package"); -#endif -} - -PackageQueue::PackageQueue() -{ - n = 0; - front = 0; - rear = 0; - prear = -1; - omp_init_lock(&queueLock); -} - -int PackageQueue::queueSize(void) -{ - int size; - omp_set_lock(&queueLock); - size = n; - omp_unset_lock(&queueLock); - return size; -} - 
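
The lockIgnore / canAvoidLock flags that recur in these queue methods let a caller that already holds queueLock (for example, a drain loop dequeuing under its own lock) skip re-acquiring a non-recursive lock. A minimal self-contained sketch of the pattern (MiniQueue, its capacity, and the int payload are illustrative stand-ins for Perilla's Package queue, not its real types; compile with -fopenmp):

    #include <omp.h>
    #include <cstdio>

    struct MiniQueue {
        enum { CAP = 16 };            // stand-in for MSG_QUEUE_DEFAULT_MAXSIZE
        int buf[CAP];
        int n = 0, front = 0, rear = 0;
        omp_lock_t lock;
        MiniQueue()  { omp_init_lock(&lock); }
        ~MiniQueue() { omp_destroy_lock(&lock); }
        void enqueue(int v, bool lockIgnore = false) {
            if (!lockIgnore) omp_set_lock(&lock);
            buf[rear] = v;
            rear = (rear + 1) % CAP;  // circular buffer: wrap instead of shifting
            ++n;
            if (!lockIgnore) omp_unset_lock(&lock);
        }
        int dequeue(bool lockIgnore = false) {
            if (!lockIgnore) omp_set_lock(&lock);
            int v = buf[front];
            front = (front + 1) % CAP;
            --n;
            if (!lockIgnore) omp_unset_lock(&lock);
            return v;
        }
        void drain() {                // takes the lock once, elides it inside
            omp_set_lock(&lock);
            while (n > 0) std::printf("%d ", dequeue(true));
            omp_unset_lock(&lock);
        }
    };

    int main() {
        MiniQueue q;
        q.enqueue(1); q.enqueue(2); q.enqueue(3);
        q.drain();                    // prints: 1 2 3 (FIFO order preserved)
        std::printf("\n");
        return 0;
    }
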
-int PackageQueue::queueSize(bool lockIgnore)
-{
-    int size;
-    if(!lockIgnore) omp_set_lock(&queueLock);
-    size = n;
-    if(!lockIgnore) omp_unset_lock(&queueLock);
-    return size;
-}
-
-void PackageQueue::enqueue(Package* package)
-{
-    omp_set_lock(&queueLock);
-    buffer[rear] = package;
-    prear = rear;
-    rear = (rear+1)%perilla::MSG_QUEUE_DEFAULT_MAXSIZE;
-    n++;
-    omp_unset_lock(&queueLock);
-}
-
-void PackageQueue::enqueue(Package* package, bool lockIgnore)
-{
-    if(!lockIgnore) omp_set_lock(&queueLock);
-    buffer[rear] = package;
-    prear = rear;
-    rear = (rear+1)%perilla::MSG_QUEUE_DEFAULT_MAXSIZE;
-    n++;
-    if(!lockIgnore) omp_unset_lock(&queueLock);
-}
-
-Package* PackageQueue::dequeue(void)
-{
-    Package* package = 0;
-    omp_set_lock(&queueLock);
-    package = buffer[front];
-    front = (front+1)%perilla::MSG_QUEUE_DEFAULT_MAXSIZE;
-    n--;
-    omp_unset_lock(&queueLock);
-    return package;
-}
-
-Package* PackageQueue::dequeue(bool lockIgnore)
-{
-    Package* package = 0;
-    if(!lockIgnore) omp_set_lock(&queueLock);
-    if(n==0)  // underflow is about to happen; report the queue state
-        std::cout << "Q size " << n << " front " << front << std::endl;
-    package = buffer[front];
-    front = (front+1)%perilla::MSG_QUEUE_DEFAULT_MAXSIZE;
-    n--;
-    if(!lockIgnore) omp_unset_lock(&queueLock);
-    return package;
-}
-#include
-#include
-#include
-#include
-#include
-
-using namespace std;
-
-namespace amrex
-{
-
-class Perilla
-{
-    static int tagGen(int src, int dest, int channelID, int nFabs, int nChannels);
-
-    public:
-    static int uTags;
-    static bool genTags;
-    static int max_step;
-
-    static std::map> pTagCnt;
-    static std::map>>>> tagMap;
-    static std::map>>> myTagMap;
-    static void clearTagMap();
-    static void clearMyTagMap();
-    static void communicateTags();
-
-    static volatile int numTeamsFinished;
-    static volatile int updateMetadata_request;
-    static volatile int updateMetadata_noticed;
-    static volatile int updateMetadata_done;
-    static Barrier * globalBarrier;
-    static void multifabBuildFabCon(RegionGraph* graph, const MultiFab& mf, const Periodicity& period);
-    static void serviceLocalRequests(RegionGraph *graph, int tg);
-    static void serviceRemoteRequests(RegionGraph *graph, int graphID, int nGraphs);
-    static void serviceRemoteRequests(RegionGraph *graph);
-    static void serviceSingleGraphComm(RegionGraph* graph, int tid);
-    static void serviceMultipleGraphComm(RegionGraph graphArray[], int nGraphs, bool cpyAcross, int tid);
-    static void serviceMultipleGraphCommDynamic(std::vector graphArray, bool cpyAcross, int tid);
-    static void flattenGraphHierarchy(std::vector >graphArray, std::vector &flattenedGraphArray);
-    static void serviceMultipleGraphComm(RegionGraph graphArray[], int nGraphs, int tid);
-    static void fillBoundaryPush(RegionGraph* graph, MultiFab* mf, int f);
-    static void fillBoundaryPull(RegionGraph* graph, MultiFab* mf, int f);
-    static void fillBoundaryPull(RegionGraph* graph, MultiFab* mf, int f, bool singleT);
-
-    static void multifabExtractCopyAssoc(RegionGraph* gDst, RegionGraph* gSrc, const MultiFab& dmf, const MultiFab& smf, int nc, int ng, int ngSrc, const Periodicity& period);
-    static void multifabExtractCopyAssoc(RegionGraph* gDst, RegionGraph* gSrc, const MultiFab& dmf, const MultiFab& smf, const Periodicity& period);
-    static void multifabCopyPushAsync(RegionGraph* destGraph, RegionGraph* srcGraph, MultiFab* dmf, MultiFab* smf, int f, int dstcomp, int srccomp, int nc, int ng, int ngsrc, bool singleT);
-    static void multifabCopyPushAsync(RegionGraph* destGraph, RegionGraph* srcGraph, MultiFab* dmf, MultiFab* smf, int f, bool singleT);
-
-    static void multifabCopyPush(RegionGraph* destGraph, RegionGraph* srcGraph, amrex::MultiFab* dmf, amrex::MultiFab* smf, int f, int dstcomp, int srccomp, int 
nc, int ng, int ngsrc, bool singleT); - static void multifabCopyPush(RegionGraph* destGraph, RegionGraph* srcGraph, amrex::MultiFab* dmf, amrex::MultiFab* smf, int f, bool singleT); - - static void multifabCopyPush_1Team(RegionGraph* destGraph, RegionGraph* srcGraph, amrex::MultiFab* dmf, amrex::MultiFab* smf, int f, int dstcomp, int srccomp, int nc, int ng, int ngsrc, bool singleT); - - static void multifabCopyPull(RegionGraph* destGraph, RegionGraph* srcGraph, MultiFab* dmf, MultiFab* smf, int f, int dstcomp, int srccomp, int nc, int ng, int ngsrc, bool singleT); - static void multifabCopyPull(RegionGraph* destGraph, RegionGraph* srcGraph, MultiFab* dmf, MultiFab* smf, int f, bool singleT); - - static void serviceLocalGridCopyRequests(std::vector graphArray, int g, int tg); - static void serviceRemoteGridCopyRequests(std::vector graphArray, int g, int nGraph, int tg); - static void resetRemoteGridCopyRequests(std::vector graphArray, int g, int nGraph, int tg); - - static void fillBoundaryPush(amrex::RGIter& rgi, amrex::MultiFab& mf); - static void fillBoundaryPull(amrex::RGIter& rgi, amrex::MultiFab& mf, bool singleT); - static void fillBoundaryPush(amrex::RGIter& rgi, RegionGraph *graph, amrex::MultiFab& mf); - static void fillBoundaryPull(amrex::RGIter& rgi, RegionGraph *graph, amrex::MultiFab& mf, bool singleT); - -}; // class Perilla - - -}//end namespace - -#endif diff --git a/Src/AmrTask/rts_impls/mpi_omp/Perilla.cpp b/Src/AmrTask/rts_impls/mpi_omp/Perilla.cpp deleted file mode 100755 index ade1cd8c6b3..00000000000 --- a/Src/AmrTask/rts_impls/mpi_omp/Perilla.cpp +++ /dev/null @@ -1,2943 +0,0 @@ -#include -#include -#include -#include -#include -#include -#include -#include -#include -#include -#include -#include -#include -using namespace std; -using namespace amrex; -using namespace perilla; - -volatile int Perilla::numTeamsFinished = 0; -volatile int Perilla::updateMetadata_request = 0; -volatile int Perilla::updateMetadata_noticed = 0; -volatile int Perilla::updateMetadata_done = 0; -int Perilla::max_step=1; -std::map> Perilla::pTagCnt; -int Perilla::uTags=0; -bool Perilla::genTags=true; -std::map > > > > Perilla::tagMap; -std::map > > > Perilla::myTagMap; - -void Perilla::clearTagMap(){ - Perilla::tagMap.clear(); -} - -void Perilla::clearMyTagMap(){ - Perilla::myTagMap.clear(); -} - -void Perilla::communicateTags() -{ - int myProc = ParallelDescriptor::MyProc(); - int nPs = ParallelDescriptor::NProcs(); - typedef std::map tags_t; - typedef std::map> stags_t; - typedef std::map>> dstags_t; - typedef std::map>>> gdstags_t; - typedef std::map>>>> pgdstags_t; - - int** tags = new int*[nPs]; - int** rtags = new int*[nPs]; - int* rTagCnt = new int[nPs*2]; - int* sTagCnt = new int[nPs*2]; - - MPI_Request *srrequest; - srrequest = new MPI_Request[nPs]; - MPI_Request *ssrequest; - ssrequest = new MPI_Request[nPs]; - MPI_Request *trrequest; - trrequest = new MPI_Request[nPs]; - MPI_Request *tsrequest; - tsrequest = new MPI_Request[nPs]; - - std::vector proc_communicated; - - proc_communicated.resize(nPs); - for(int p=0; psecond.begin(); it2 != it1->second.end(); it2++) - { - tac++; - tac++; - ng++; - for(dstags_t::iterator it3 = it2->second.begin(); it3 != it2->second.end(); it3++) - for(stags_t::iterator it4 = it3->second.begin(); it4 != it3->second.end(); it4++) - for(tags_t::iterator it5 = it4->second.begin(); it5 != it4->second.end(); it5++) - { - tac+=4; - } - } - sTagCnt[it1->first*2] = tac; - sTagCnt[it1->first*2+1] = ng; - tags[it1->first] = new int[sTagCnt[it1->first*2]]; - 
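// The Isend just below ships a 2-int header (total ints to follow, number
// of graphs) on tag 0; the packed 4-int records follow on tag 1.  A minimal
// standalone sketch of that two-phase count-then-payload exchange (names
// here are illustrative, not the Perilla API):
#include <mpi.h>
#include <vector>

// Post both sends for one destination rank.  lenStorage must stay alive
// until the requests complete, since MPI_Isend does not copy the buffer.
inline void postTagSends(const std::vector<int>& payload, int dest,
                         int& lenStorage, MPI_Request reqs[2])
{
    lenStorage = static_cast<int>(payload.size());
    MPI_Isend(&lenStorage, 1, MPI_INT, dest, /*tag*/0, MPI_COMM_WORLD, &reqs[0]);
    MPI_Isend(const_cast<int*>(payload.data()), lenStorage, MPI_INT, dest,
              /*tag*/1, MPI_COMM_WORLD, &reqs[1]);
}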
MPI_Isend(&sTagCnt[it1->first*2], 2, MPI_INT, it1->first, 0, MPI_COMM_WORLD, &ssrequest[it1->first]); - proc_communicated[it1->first]=true; - } - - for(int p=0; psecond.begin(); it2 != it1->second.end(); it2++) - { - tags[it1->first][tac++] = it2->first; - tags[it1->first][tac++] = pTagCnt[it1->first][it2->first]; - int gtagc = 0; - for(dstags_t::iterator it3 = it2->second.begin(); it3 != it2->second.end(); it3++) - for(stags_t::iterator it4 = it3->second.begin(); it4 != it3->second.end(); it4++) - for(tags_t::iterator it5 = it4->second.begin(); it5 != it4->second.end(); it5++) - { - tags[it1->first][tac++] = it3->first; - tags[it1->first][tac++] = it4->first; - tags[it1->first][tac++] = it5->first; - tags[it1->first][tac++] = it5->second; - gtagc++; - } - BL_ASSERT(pTagCnt[it1->first][it2->first] == gtagc); - } - MPI_Isend(tags[it1->first], tac, MPI_INT, it1->first, 1, MPI_COMM_WORLD, &tsrequest[it1->first]); - } - - - MPI_Status status; - for(int p=0; p 0) - { - rtags[p] = new int[rTagCnt[p*2]]; - MPI_Irecv(rtags[p], rTagCnt[p*2], MPI_INT, p , 1, MPI_COMM_WORLD, &trrequest[p]); - } - } - } - - // //MPI_Irecv(size) Wait - - - //MPI_recive tags arra - for(int p=0; p 0) - { - MPI_Wait( &trrequest[p], &status ); - int tCnt=0; - for(int g=0; g 0) - { - delete[] rtags[p]; - } - } - - - for(int p=0; p perilla::MAX_SQRT_TAG) maxRange= 1024; - return (src%maxRange)*maxRange + (dest%maxRange) + channelID*(perilla::MAX_SQRT_TAG*(perilla::MAX_SQRT_TAG+1)/nChannels); - - //int nfabs = 256; - - //if(src >= nfabs || dest>=nfabs) - // std::cout<<"Warnig Tag" << src << " " << dest << " "<= MPI_TAG_UB ) - std::cout << "Out of Bound tag " << (src%maxRange)*maxRange + (dest%maxRange) + channelID*(maxSR*(maxSR+1)/nChannels) << " " <size(); - const int n_snds_mf = TheFB.m_SndTags->size(); - const int n_rcvs_mf = TheFB.m_RcvTags->size(); - - Vector send_cctc; - Vector send_pr; - send_cctc.reserve(n_snds_mf); - - for (FabArrayBase::MapOfCopyComTagContainers::const_iterator m_it = TheFB.m_SndTags->begin(), - m_End = TheFB.m_SndTags->end(); - m_it != m_End; - ++m_it) - { - if(m_it->first != myProc) // Not destined to me. 
- { - send_pr.push_back(m_it->first); - send_cctc.push_back(&(m_it->second)); - } - } - - Vector recv_cctc; - Vector recv_pr; - recv_cctc.reserve(n_rcvs_mf); - - for (FabArrayBase::MapOfCopyComTagContainers::const_iterator m_it = TheFB.m_RcvTags->begin(), - m_End = TheFB.m_RcvTags->end(); - m_it != m_End; - ++m_it) - { - if(m_it->first != myProc) // I am not the source for this receipt - { - recv_pr.push_back(m_it->first); - recv_cctc.push_back(&(m_it->second)); - } - } -#pragma omp parallel shared(rg, mf, numfabs, np, TheFB, recv_cctc, send_cctc) - { - //int tg = WorkerThread::perilla_wid(); - int fg; - //if(WorkerThread::perilla_isCommunicationThread()) -#pragma omp single - { - //bool cc = !mf->is_nodal(); // cc = multifab_cell_centered_q(mf) - //mf->sMap.reserve(numfabs); - //mf->rMap.reserve(numfabs); - //std::cout<< "Allocating sMap and rMap" <alloc_lMap(mf); - rg->alloc_sMap(mf); - rg->alloc_rMap(mf); - } -#pragma omp barrier - //if(tid==0) - { - //bool cc = !mf->is_nodal(); // cc = multifab_cell_centered_q(mf) - //mf->sMap.reserve(numfabs); - //mf->rMap.reserve(numfabs); -#pragma omp for - for(int f=0; flMap[f]->l_con.nscpy = 0; - - //for(int i=0; il_con.ncpy; i++) - for(int i=0; il_con.cpy[i].ns)) //LocalIndex - if(mf.IndexArray()[f] == tag.srcIndex) - rg->lMap[f]->l_con.nscpy++; - //if(f == local_index(mf,bxasc->l_con.cpy[i].nd)) //LocalIndex - if(mf.IndexArray()[f] == tag.dstIndex) - rg->lMap[f]->l_con.ndcpy++; - } - /* - if(rg->lMap[f]->l_con.nscpy+rg->lMap[f]->l_con.ndcpy != n_loc_mf) - std::cout<< "Diff in Sum " << rg->lMap[f]->l_con.nscpy << " " <lMap[f]->l_con.ndcpy << " " << n_loc_mf <lMap[f]->l_con.nscpy+rg->lMap[f]->l_con.ndcpy == n_loc_mf); - */ - } - } - } -#pragma omp barrier - //now we know how many copying segments each fab owns as source and destination allocate memory for metadata -#pragma omp for - for(int f=0; flMap[f]->l_con.sLock)); - //omp_init_lock(&(rg->lMap[f]->l_con.dLock)); - //omp_init_lock(&(rg->lMap[f]->l_con.ghostLock)); - - //std::cout<< "MF l_con nscpy " <lMap[f]->l_con.nscpy << " ndcpy " << rg->lMap[f]->l_con.ndcpy <lMap[f]->l_con.scpy = new LocalCopyDescriptor[rg->lMap[f]->l_con.nscpy]; - rg->lMap[f]->l_con.dcpy = new LocalCopyDescriptor[rg->lMap[f]->l_con.ndcpy]; - rg->lMap[f]->l_con.scpyCnt = 0; - rg->lMap[f]->l_con.dcpyCnt = 0; - } - } -#pragma omp barrier - if(np > 1) - { -#pragma omp for - for(int f=0; flMap[f]->r_con.nrcv = 0; - rg->lMap[f]->r_con.nsnd = 0; - rg->lMap[f]->r_con.firingRuleCnt = 0; - - //for(int i=0; ir_con.nsnd; i++) - for(int i=0; ir_con.snd[i].ns)) //LocalIndex - if(mf.IndexArray()[f] == it->srcIndex) - { - rg->lMap[f]->r_con.nsnd++; - } - } - } - //for(int i=0; ir_con.nrcv; i++) - for(int i=0; ir_con.rcv[i].nd)) //LocalIndex - if(mf.IndexArray()[f] == it->dstIndex) - { - rg->lMap[f]->r_con.nrcv++; - } - } - } - //rg->sMap[f]->r_con.sndLock = new omp_lock_t; - //rg->rMap[f]->r_con.rcvLock = new omp_lock_t; - //omp_init_lock(rg->sMap[f]->r_con.sndLock); - //omp_init_lock(rg->rMap[f]->r_con.rcvLock); - rg->lMap[f]->r_con.snd = new RemoteCommDescriptor[rg->lMap[f]->r_con.nsnd]; - rg->lMap[f]->r_con.rcv = new RemoteCommDescriptor[rg->lMap[f]->r_con.nrcv]; - } - } - //if(WorkerThread::perilla_isMasterWorkerThread() && tg==0) - { -#pragma omp for - for(int f=0; frMap[f]->r_con.nrcv = 0; - rg->sMap[f]->r_con.nsnd = 0; - - //for(int i=0; ir_con.nsnd; i++) - for(int i=0; ir_con.snd[i].ns)) //LocalIndex - if(mf.IndexArray()[f] == it->srcIndex) - { - rg->sMap[f]->r_con.nsnd++; - } - } - } - //for(int i=0; ir_con.nrcv; i++) - for(int 
i=0; ir_con.rcv[i].nd)) //LocalIndex - if(mf.IndexArray()[f] == it->dstIndex) - { - rg->rMap[f]->r_con.nrcv++; - } - } - } - //rg->sMap[f]->r_con.sndLock = new omp_lock_t; - //rg->rMap[f]->r_con.rcvLock = new omp_lock_t; - //omp_init_lock(rg->sMap[f]->r_con.sndLock); - //omp_init_lock(rg->rMap[f]->r_con.rcvLock); - rg->sMap[f]->r_con.snd = new RemoteCommDescriptor[rg->sMap[f]->r_con.nsnd]; - rg->rMap[f]->r_con.rcv = new RemoteCommDescriptor[rg->rMap[f]->r_con.nrcv]; - } - } - } - } // omp parallel - //std::cout<< "counting done " <lMap[f]->l_con.localBarrier = new Barrier(perilla::NUM_THREADS_PER_TEAM-1); - // !create local communication meta data for sources and destinations - scnt = -1; - dcnt = -1; - //for(int i=0; il_con.ncpy; i++) - for(int i=0; il_con.cpy[i].ns)) //LocalIndex - if(mf.IndexArray()[f] == tag.srcIndex) - { - scnt++; - //omp_init_lock(&(rg->lMap[f]->l_con.scpy[scnt].ghostLock)); - rg->lMap[f]->l_con.scpy[scnt].ns = mf.localindex(tag.srcIndex); //local_index(mf,bxasc->l_con.cpy[i].ns); //LocalIndex - rg->lMap[f]->l_con.scpy[scnt].nd = mf.localindex(tag.dstIndex); //local_index(mf,bxasc->l_con.cpy[i].nd); //LocalIndex - rg->lMap[f]->l_con.scpy[scnt].sbx = tag.sbox; //bxasc->l_con.cpy[i].sbx; - rg->lMap[f]->l_con.scpy[scnt].dbx = tag.dbox; //bxasc->l_con.cpy[i].dbx; - // !create queues for ghost cells - //call queue_init(mf%fbs(f)%l_con%scpy(scnt)%pQueue) - //call queue_init(mf%fbs(f)%l_con%scpy(scnt)%recycleQueue) - int psize = tag.sbox.numPts() * mf.nComp(); //---------------------------------------------------------------???????????????? - /* - p => dataptr(mf%fbs(f), mf%fbs(f)%l_con%scpy(scnt)%sbx, 1, mf%nc) - s1= size(p,1) - s2= size(p,2) - s3= size(p,3) - s4= size(p,4) - s1*s2*s3*s4 - */ - for(int p=0; pdatabuf[j] = 0; - rg->lMap[f]->l_con.scpy[scnt].pQueue.enqueue(tmpPkg); - } - for(int p=0; plMap[f]->l_con.scpy[scnt].recycleQueue.enqueue(rg->lMap[f]->l_con.scpy[scnt].pQueue.dequeue()); - } - //if(f == local_index(mf,bxasc->l_con.cpy[i].nd)) //LocalIndex - if(mf.IndexArray()[f] == tag.dstIndex) - { - dcnt++; - rg->lMap[f]->l_con.dcpy[dcnt].ns = mf.localindex(tag.srcIndex); //local_index(mf,bxasc->l_con.cpy[i].ns); //LocalIndex - rg->lMap[f]->l_con.dcpy[dcnt].nd = mf.localindex(tag.dstIndex); //local_index(mf,bxasc->l_con.cpy[i].nd); //LocalIndex - rg->lMap[f]->l_con.dcpy[dcnt].sbx = tag.sbox; //bxasc->l_con.cpy[i].sbx; - rg->lMap[f]->l_con.dcpy[dcnt].dbx = tag.dbox; //bxasc->l_con.cpy[i].dbx; - //call queue_init(mf%fbs(f)%l_con%dcpy(dcnt)%pQueue) - //call queue_init(mf%fbs(f)%l_con%dcpy(dcnt)%recycleQueue) - int psize = tag.dbox.numPts() * mf.nComp(); //---------------------------------------------------------------???????????????? 
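// Package sizing rule used throughout: one Package buffers
// box.numPts() * nComp() doubles, so a 32x32x32 box with 2 components needs
// 32*32*32*2 = 65,536 doubles (512 KB).  The pool-priming loops above lost
// their bounds in extraction; a sketch of the intended fill-then-park
// pattern, with the pool depth as an assumed parameter:
static void primePackagePool(PackageQueue& pQ, PackageQueue& recycleQ,
                             int psize, int poolDepth /* assumed constant */)
{
    for (int p = 0; p < poolDepth; p++) {
        Package* pkg = new Package(psize);              // psize doubles
        for (int j = 0; j < psize; j++) pkg->databuf[j] = 0;
        pQ.enqueue(pkg);                                // live queue first
    }
    for (int p = 0; p < poolDepth; p++)                 // park all in recycle
        recycleQ.enqueue(pQ.dequeue());
}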
- /* - p => dataptr(mf%fbs(f), mf%fbs(f)%l_con%dcpy(dcnt)%dbx, 1, mf%nc) - s1= size(p,1) - s2= size(p,2) - s3= size(p,3) - s4= size(p,4) - s1*s2*s3*s4 - */ - - for(int p=0; pdatabuf[j] = 0; - rg->lMap[f]->l_con.dcpy[dcnt].pQueue.enqueue(tmpPkg); - } - for(int p=0; plMap[f]->l_con.dcpy[dcnt].recycleQueue.enqueue(rg->lMap[f]->l_con.dcpy[dcnt].pQueue.dequeue()); - } - } // for(ilMap[f]->l_con.nscpy; i++) - for(int j=0; jlMap[rg->lMap[f]->l_con.scpy[i].nd]->l_con.ndcpy; j++) - if(rg->lMap[f]->l_con.scpy[i].dbx == rg->lMap[rg->lMap[f]->l_con.scpy[i].nd]->l_con.dcpy[j].dbx) - rg->lMap[f]->l_con.scpy[i].dPartner = j; - - for(int i=0; ilMap[f]->l_con.ndcpy; i++) - for(int j=0; jlMap[rg->lMap[f]->l_con.dcpy[i].ns]->l_con.nscpy; j++) - if(rg->lMap[f]->l_con.dcpy[i].dbx == rg->lMap[rg->lMap[f]->l_con.dcpy[i].ns]->l_con.scpy[j].dbx) - rg->lMap[f]->l_con.dcpy[i].sPartner = j; - } - } - - if(np == 1) return; - - //std::cout<< "local init done" <lMap[f]->r_con.sndLock = new omp_lock_t; - //rg->lMap[f]->r_con.rcvLock = new omp_lock_t; - //omp_init_lock(rg->lMap[f]->r_con.sndLock); - //omp_init_lock(rg->lMap[f]->r_con.rcvLock); - //rg->lMap[f]->r_con.snd = new RemoteCommDescriptor[rg->lMap[f]->r_con.nsnd]; - //rg->lMap[f]->r_con.rcv = new RemoteCommDescriptor[rg->lMap[f]->r_con.nrcv]; - nrcv= -1; - //for(int i=0; ir_con.nrcv; i++) - for(int i=0; ir_con.rcv[i].nd)) //LocalIndex - if(mf.IndexArray()[f] == it->dstIndex) - { - nrcv++; - rg->lMap[f]->r_con.rcv[nrcv].ns = it->srcIndex; //bxasc->r_con.rcv[i].ns; - //rg->lMap[f]->r_con.rcv[nrcv].lnd = ; //local_index(mf,bxasc->r_con.rcv[i].nd); // not used anywhere so deferred ---------???????? - //rg->lMap[f]->r_con.rcv[nrcv].lns = -1; //undefined - rg->lMap[f]->r_con.rcv[nrcv].nd = it->dstIndex; //bxasc->r_con.rcv[i].nd; - rg->lMap[f]->r_con.rcv[nrcv].lnd = mf.localindex(it->dstIndex); - rg->lMap[f]->r_con.rcv[nrcv].lns = mf.localindex(it->srcIndex); - rg->lMap[f]->r_con.rcv[nrcv].sbx = it->sbox; //bxasc->r_con.rcv[i].sbx; - rg->lMap[f]->r_con.rcv[nrcv].dbx = it->dbox; //bxasc->r_con.rcv[i].dbx; - rg->lMap[f]->r_con.rcv[nrcv].pr = pr; //bxasc->r_con.rcv[i].pr; - rg->lMap[f]->r_con.rcv[nrcv].cnt = 0; - //!create queues for ghost cells - //call queue_init(mf%fbs(f)%r_con%rcv(nrcv)%pQueue) - //call queue_init(mf%fbs(f)%r_con%rcv(nrcv)%recycleQueue) - int psize = it->sbox.numPts() * mf.nComp(); //---------------------------------------------------------------???????????????? - /* - p => dataptr(mf%fbs(f), mf%fbs(f)%r_con%rcv(nrcv)%dbx, 1, mf%nc) - s1= size(p,1) - s2= size(p,2) - s3= size(p,3) - s4= size(p,4) - s1*s2*s3*s4 - */ - rg->lMap[f]->r_con.rcv[nrcv].sz = psize; - for(int p=0; pdatabuf[j] = 0; - rg->lMap[f]->r_con.rcv[nrcv].pQueue.enqueue(tmpPkg); - } - for(int p=0; plMap[f]->r_con.rcv[nrcv].recycleQueue.enqueue(rg->lMap[f]->r_con.rcv[nrcv].pQueue.dequeue()); - } - } - } // for(ir_con.nsnd; i++) - for(int i=0; ir_con.snd[i].ns)) //LocalIndex - if(mf.IndexArray()[f] == it->srcIndex ) - { - nsnd++; - rg->lMap[f]->r_con.snd[nsnd].ns = it->srcIndex; //bxasc->r_con.snd[i].ns; - rg->lMap[f]->r_con.snd[nsnd].nd = it->dstIndex; //bxasc->r_con.snd[i].nd; - //rg->lMap[f]->r_con.snd[nsnd].lns = ; //local_index(mf,bxasc->r_con.snd[i].ns); //not used anywhere so deferred ------????????? 
- //rg->lMap[f]->r_con.snd[nsnd].lnd = -1; //undefined - rg->lMap[f]->r_con.snd[nsnd].lns = mf.localindex(it->srcIndex); - rg->lMap[f]->r_con.snd[nsnd].lnd = mf.localindex(it->dstIndex); - rg->lMap[f]->r_con.snd[nsnd].sbx = it->sbox; //bxasc->r_con.snd[i].sbx; - rg->lMap[f]->r_con.snd[nsnd].dbx = it->dbox; //bxasc->r_con.snd[i].dbx; - rg->lMap[f]->r_con.snd[nsnd].pr = pr; //bxasc->r_con.snd[i].pr; - rg->lMap[f]->r_con.snd[nsnd].cnt = 0; - //!create queues for ghost cells - //call queue_init(mf%fbs(f)%r_con%snd(nsnd)%pQueue) - //call queue_init(mf%fbs(f)%r_con%snd(nsnd)%recycleQueue) - int psize = it->sbox.numPts() * mf.nComp(); //---------------------------------------------------------------???????????????? - /* - p => dataptr(mf%fbs(f), mf%fbs(f)%r_con%snd(nsnd)%sbx, 1, mf%nc) - s1= size(p,1) - s2= size(p,2) - s3= size(p,3) - s4= size(p,4) - s1*s2*s3*s4 - */ - rg->lMap[f]->r_con.snd[nsnd].sz = psize; - for(int p=0; pdatabuf[j] = 0; - rg->lMap[f]->r_con.snd[nsnd].pQueue.enqueue(tmpPkg); - } - for(int p=0; plMap[f]->r_con.snd[nsnd].recycleQueue.enqueue(rg->lMap[f]->r_con.snd[nsnd].pQueue.dequeue()); - - //std::cout<< "RQ f "<< f << " i "<< nsnd <lMap[f]->r_con.nsnd; i++) - { - rg->sMap[f]->r_con.snd[i].ns = rg->lMap[f]->r_con.snd[i].ns; - rg->sMap[f]->r_con.snd[i].nd = rg->lMap[f]->r_con.snd[i].nd; - rg->sMap[f]->r_con.snd[i].lns = rg->lMap[f]->r_con.snd[i].lns; - rg->sMap[f]->r_con.snd[i].lnd = rg->lMap[f]->r_con.snd[i].lnd; - rg->sMap[f]->r_con.snd[i].r_gid = rg->graphID-1; - rg->sMap[f]->r_con.snd[i].r_grids = rg->numFabs; - rg->sMap[f]->r_con.snd[i].sbx = rg->lMap[f]->r_con.snd[i].sbx; - rg->sMap[f]->r_con.snd[i].dbx = rg->lMap[f]->r_con.snd[i].dbx; - rg->sMap[f]->r_con.snd[i].pr = rg->lMap[f]->r_con.snd[i].pr; - rg->sMap[f]->r_con.snd[i].sz = rg->lMap[f]->r_con.snd[i].sz; - rg->sMap[f]->r_con.snd[i].cnt = 0; - rg->lMap[f]->r_con.snd[i].cnt = 0; - - for(int p=0; plMap[f]->r_con.snd[i].sz); - for(int j=0; jlMap[f]->r_con.snd[i].sz; j++) - tmpPkg->databuf[j] = 0; - rg->sMap[f]->r_con.snd[i].pQueue.enqueue(tmpPkg); - } - for(int p=0; psMap[f]->r_con.snd[i].recycleQueue.enqueue(rg->sMap[f]->r_con.snd[i].pQueue.dequeue()); - } - for(int i=0; ilMap[f]->r_con.nrcv; i++) - { - rg->rMap[f]->r_con.rcv[i].ns = rg->lMap[f]->r_con.rcv[i].ns; - rg->rMap[f]->r_con.rcv[i].nd = rg->lMap[f]->r_con.rcv[i].nd; - rg->rMap[f]->r_con.rcv[i].lns = rg->lMap[f]->r_con.rcv[i].lns; - rg->rMap[f]->r_con.rcv[i].lnd = rg->lMap[f]->r_con.rcv[i].lnd; - rg->rMap[f]->r_con.rcv[i].r_gid = rg->graphID-1; - rg->rMap[f]->r_con.rcv[i].r_grids = rg->numFabs; - rg->rMap[f]->r_con.rcv[i].sbx = rg->lMap[f]->r_con.rcv[i].sbx; - rg->rMap[f]->r_con.rcv[i].dbx = rg->lMap[f]->r_con.rcv[i].dbx; - rg->rMap[f]->r_con.rcv[i].pr = rg->lMap[f]->r_con.rcv[i].pr; - rg->rMap[f]->r_con.rcv[i].sz = rg->lMap[f]->r_con.rcv[i].sz; - rg->rMap[f]->r_con.rcv[i].cnt = 0; - rg->lMap[f]->r_con.rcv[i].cnt = 0; - - if(Perilla::genTags) - { - try - { - int rcv_pr = rg->rMap[f]->r_con.rcv[i].pr; - int dstIndex = rg->rMap[f]->r_con.rcv[i].nd; - int srcIndex = rg->rMap[f]->r_con.rcv[i].ns; - int psize = rg->rMap[f]->r_con.rcv[i].sz; - std::map::iterator itr = tagMap[rcv_pr][rg->graphID-1][dstIndex][srcIndex].find(psize); - if( itr != tagMap[rcv_pr][rg->graphID-1][dstIndex][srcIndex].end()) - { - //rg->rCopyMapHead->map[f]->r_con.rcv[dcnt].lnd = itr->second; - } - else - { - tagMap[rcv_pr][rg->graphID-1][dstIndex][srcIndex][psize] = Perilla::uTags++; - //rg->rCopyMapHead->map[f]->r_con.rcv[dcnt].lnd = Perilla::uTags++; - std::map::iterator itr2 = 
pTagCnt[rcv_pr].find(rg->graphID-1); - if(itr2 != pTagCnt[rcv_pr].end()) - pTagCnt[rcv_pr][rg->graphID-1] = pTagCnt[rcv_pr][rg->graphID-1] + 1; - else - pTagCnt[rcv_pr][rg->graphID-1] = 1; - } - } - catch(std::exception& e) - { - std::cout <<"Inside tagGeneration gID "<< rg->graphID <<" "<< e.what() << '\n'; - } - } - //tagMap[rcv_pr][rg->graphID][it->dstIndex][it->srcIndex] = pTagCnt[rcv_pr]; - - for(int p=0; plMap[f]->r_con.rcv[i].sz); - for(int j=0; jlMap[f]->r_con.rcv[i].sz; j++) - tmpPkg->databuf[j] = 0; - rg->rMap[f]->r_con.rcv[i].pQueue.enqueue(tmpPkg); - } - for(int p=0; prMap[f]->r_con.rcv[i].recycleQueue.enqueue(rg->rMap[f]->r_con.rcv[i].pQueue.dequeue()); - } - } - }// if(tid==0) - - }// omp parallel -}// multifabBuildFabCon - -void Perilla::serviceLocalRequests(RegionGraph* rg, int tg) -{ - int numfabs = rg->lMap.size(); - - for(int f=0; fgraphID <lMap[f]->l_con.sLock)); - //if(lockSucceeded != 0) // 0-Fail, otherwise-Succeed - { - //if(graph->graphID == 1) - //if(tg == 0) - //std::cout<<"I am tg " << tg << " processing " << f << " in Graph " << graph->graphID <graphID == 1 && (f == 2 || f == 1) ) - { - std::cout<< "serviceLR for gID 1 f " << f << " nscpy "<< rg->lMap[f]->l_con.nscpy << std::endl; - for(int i=0; ilMap[f]->l_con.nscpy; i++) - std::cout<< " " << rg->lMap[f]->l_con.scpy[i].nd << " " << rg->lMap[f]->l_con.scpy[i].dPartner << " " << rg->lMap[f]->l_con.scpy[i].pQueue.queueSize(); - std::cout<< std::endl; - }*/ - for(int i=0; ilMap[f]->l_con.nscpy; i++){ - - //std::cout<< "serviceLR nscpy " << rg->lMap[f]->l_con.nscpy <graphID == 1 && rg->lMap[f]->l_con.scpy[i].nd == 1) - //std::cout<< "Processing gID 1 nd 1 from f " << f << " i " << i << std::endl; - - if(rg->lMap[f]->l_con.scpy[i].pQueue.queueSize()>0) - { - omp_set_lock(&(rg->lMap[f]->l_con.sLock)); - Package *sPackage = rg->lMap[f]->l_con.scpy[i].pQueue.dequeue(); - if(perilla::LAZY_PUSH) - { - // Implemetation deffered. Currently not required - } - //if(graph->graphID == 1 && rg->lMap[f]->l_con.scpy[i].nd == 1) - //std::cout<< "Processing gID 1 nd 1 from f " << f << " i " << i << std::endl; - omp_set_lock(&(rg->lMap[rg->lMap[f]->l_con.scpy[i].nd]->l_con.dLock)); - int dPartner = rg->lMap[f]->l_con.scpy[i].dPartner; - - //if(rg->lMap[rg->lMap[f]->l_con.scpy[i].nd]->l_con.dcpy[dPartner].recycleQueue.queueSize() == 0 ) - if(dPartner == -1) - std::cout<< " Caution rQ size dPrtn "<< rg->lMap[rg->lMap[f]->l_con.scpy[i].nd]->l_con.ndcpy << " " << dPartner <<" graph ID " <graphID<lMap[rg->lMap[f]->l_con.scpy[i].nd]->l_con.dcpy[dPartner].recycleQueue.queueSize() <lMap[rg->lMap[f]->l_con.scpy[i].nd]->l_con.dcpy[dPartner].recycleQueue.dequeue(true); - - //for(int j=0; jbufSize; j++) - //dPackage->databuf[j] = sPackage->databuf[j]; //copy data------------------------------??????????????? 
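// The commented-out element loop above was replaced by the single
// std::memcpy on the next line.  The source and destination boxes of one
// copy tag span the same number of points, so
// dPackage->bufSize * sizeof(double) is the right byte count for either
// buffer; a defensive variant would first
//     assert(dPackage->bufSize == sPackage->bufSize);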
- - std::memcpy(dPackage->databuf, sPackage->databuf, dPackage->bufSize * sizeof(double)); - - rg->lMap[rg->lMap[f]->l_con.scpy[i].nd]->l_con.dcpy[dPartner].pQueue.enqueue(dPackage,true); - if(rg->lMap[rg->lMap[f]->l_con.scpy[i].nd]->l_con.dcpy[dPartner].pQueue.queueSize(true)==1) - rg->lMap[rg->lMap[f]->l_con.scpy[i].nd]->l_con.firingRuleCnt++; - //if(graph->graphID == 1 && rg->lMap[f]->l_con.scpy[i].nd == 1) - //std::cout << "gID 1 frc " << rg->lMap[rg->lMap[f]->l_con.scpy[i].nd]->l_con.firingRuleCnt << " df " << rg->lMap[f]->l_con.scpy[i].nd <lMap[rg->lMap[f]->l_con.scpy[i].nd]->l_con.dLock)); - - //if(graph->graphID == 1) - //std::cout<< "Processed gID 1 f " << rg->lMap[f]->l_con.scpy[i].nd << std::endl; - - rg->lMap[f]->l_con.scpy[i].recycleQueue.enqueue(sPackage,true); - }} - omp_unset_lock(&(rg->lMap[f]->l_con.sLock)); -#pragma omp flush - }// if(!lock succeedded) - if(perilla::LAZY_PUSH) - { - // Implemetation deffered. Currently not required - } - }// if(tg==fg) - }// for(frMap.size(); - - // !we first post send and receive - for(int f=0; frMap[f]->r_con.rcvLock); - //if(lockSucceeded != 0) - { - //if(omp_test_lock(rg->lMap[f]->r_con.rcvLock) != 0) - { - for(int i=0; ilMap[f]->r_con.nrcv; i++) - { - if(rg->rMap[f]->r_con.rcv[i].pQueue.queueSize(true) == 0) //!no message has been received or all received messages have been claimed - nextsReq = true; - else - { - Package *rearPackage = rg->rMap[f]->r_con.rcv[i].pQueue.getRear(true);//!CHECK THIS POINT LATER - if(rearPackage->completed && rg->rMap[f]->r_con.rcv[i].pQueue.queueSize(true) == 1) //!latest receive request has been completed - nextsReq = true; - else //!expected message is still on the way - nextsReq = false; - } - if(nextsReq) //!take a message from recycle pool and post a receive - { - omp_set_lock((rg->rMap[f]->r_con.rcvLock)); - omp_set_lock((rg->lMap[f]->r_con.rcvLock)); - int ns = rg->rMap[f]->r_con.rcv[i].ns; - int nd = rg->rMap[f]->r_con.rcv[i].nd; - int lnd = rg->rMap[f]->r_con.rcv[i].lnd; - int r_grids = rg->rMap[f]->r_con.rcv[i].r_grids; - //!create a package to keep track of receive requests - Package *rMetaPackage = rg->rMap[f]->r_con.rcv[i].recycleQueue.dequeue(true); - //!extract a package from the recycle pool at the destination NUMA node to buffer incoming data - Package *rPackage = rg->lMap[f]->r_con.rcv[i].recycleQueue.dequeue(true); - //tag = tagGen(mf%rMap(f)%r_con%rcv(i)%ns, mf%rMap(f)%r_con%rcv(i)%nd, gid, parallel_nprocs()*nfabs(mf), ngr)---------?????? - //int tag = tagGen(rg->rMap[f]->r_con.rcv[i].ns, rg->rMap[f]->r_con.rcv[i].nd, graphID-1, np*numfabs, nGraphs); - int tag = tagMap[rg->rMap[f]->r_con.rcv[i].pr][graphID][nd][ns][rg->rMap[f]->r_con.rcv[i].sz]; - - rMetaPackage->request = MPI_REQUEST_NULL; - rg->lMap[f]->r_con.rcv[i].pQueue.enqueue(rPackage,true); //!this is not done yet - rg->rMap[f]->r_con.rcv[i].pQueue.enqueue(rMetaPackage,true); //!this is not done yet - //rMetaPackage->request = parallel_irecv_dv(rpackage%ptr%dataBuf,mf%rMap(f)%r_con%rcv(i)%sz, mf%rMap(f)%r_con%rcv(i)%pr, tag) --------- ???? 
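// ParallelDescriptor::Arecv below is AMReX's wrapper around MPI_Irecv; the
// raw-MPI equivalent of this post would be (sketch; the databuf elements
// are doubles, as the memcpy * sizeof(double) usage elsewhere implies):
//     MPI_Irecv(rPackage->databuf, rg->rMap[f]->r_con.rcv[i].sz, MPI_DOUBLE,
//               rg->rMap[f]->r_con.rcv[i].pr, tag, MPI_COMM_WORLD,
//               &rMetaPackage->request);
// The meta package tracks the request; the data package owns the bytes.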
- rMetaPackage->request = ParallelDescriptor::Arecv(rPackage->databuf, - rg->rMap[f]->r_con.rcv[i].sz, - rg->rMap[f]->r_con.rcv[i].pr, tag).req(); // tag == SeqNum in c++ ver - omp_unset_lock((rg->lMap[f]->r_con.rcvLock)); - omp_unset_lock((rg->rMap[f]->r_con.rcvLock)); - } - } - //omp_unset_lock(rg->lMap[f]->r_con.rcvLock); - }// if(omp_test_lock) - //omp_unset_lock(rg->rMap[f]->r_con.rcvLock); - }// if(lockSucceeded) - }// for(fsMap[f]->r_con.nsnd; i++) - { - if(rg->sMap[f]->r_con.snd[i].pQueue.queueSize(true) == 0) //then !no message has been issued or all send requests have been fulfilled - nextrReq = false; - else - nextrReq = true; - - if(nextrReq) - { - Package *sMetaPackage = rg->sMap[f]->r_con.snd[i].pQueue.getFront(true); - if(!sMetaPackage->served) - { - Package *sPackage = rg->lMap[f]->r_con.snd[i].pQueue.getFront(true); - sMetaPackage->completed = false; - sMetaPackage->served = true; - sMetaPackage->request = MPI_REQUEST_NULL; - int ns = rg->sMap[f]->r_con.snd[i].ns; - int nd = rg->sMap[f]->r_con.snd[i].nd; - int r_gid = rg->sMap[f]->r_con.snd[i].r_gid; - int r_grids = rg->sMap[f]->r_con.snd[i].r_grids; - //tag = tagGen(mf%sMap(f)%r_con%snd(i)%ns, mf%sMap(f)%r_con%snd(i)%nd, gid, parallel_nprocs()*nfabs(mf), ngr) -??????? - //int tag = tagGen(rg->sMap[f]->r_con.snd[i].ns, rg->sMap[f]->r_con.snd[i].nd, graphID-1, np*numfabs, nGraphs); - int tag = Perilla::myTagMap[r_gid][nd][ns][rg->sMap[f]->r_con.snd[i].sz]; - //int tag = myTagMap[graphID-1][rg->sMap[f]->r_con.snd[i].nd][rg->sMap[f]->r_con.snd[i].ns]; - //sMetaPackage%ptr%request = parallel_isend_dv(spackage%ptr%dataBuf,mf%sMap(f)%r_con%snd(i)%sz, mf%sMap(f)%r_con%snd(i)%pr, tag) --????? - sMetaPackage->request = ParallelDescriptor::Asend(sPackage->databuf, - rg->sMap[f]->r_con.snd[i].sz, - rg->sMap[f]->r_con.snd[i].pr, tag).req(); // tag == SeqNum in c++ ver - } - } - } // for(irMap[f]->r_con.nrcv; i++) - { - if(rg->rMap[f]->r_con.rcv[i].pQueue.queueSize(true) > 0) //!all messages before rear have completed - { - //if(omp_test_lock(rg->lMap[f]->r_con.rcvLock) != 0) // 0-Fail, otherwise-Succeed - { - Package *rearPackage = rg->rMap[f]->r_con.rcv[i].pQueue.getRear(true); - if(!rearPackage->completed) - { - bool flag = false; - int ret_flag; - MPI_Status status; - - std::cout<< "myP "<< myProc << " f "<< f << " i "<< i<< " Req "<request << std::endl; - - ParallelDescriptor::Test(rearPackage->request, ret_flag, status); - flag = (ret_flag == 0) ? false : true;//parallel_test_one(rearPackage%ptr%request) -------??????? - if(flag) - { - omp_set_lock((rg->lMap[f]->r_con.rcvLock)); - rearPackage->completeRequest(); - rg->lMap[f]->r_con.rcv[i].pQueue.getRear()->completeRequest(); - if(rg->rMap[f]->r_con.rcv[i].pQueue.queueSize(true) == 1) - rg->lMap[f]->r_con.firingRuleCnt++; - omp_unset_lock((rg->lMap[f]->r_con.rcvLock)); -#pragma omp flush - } - } - //omp_unset_lock(rg->lMap[f]->r_con.rcvLock); - } // if(omp_test_lock) - } // if(queueSize > 0) - } // for(ilMap[f]->r_con.nsnd; i++) - { - if(rg->sMap[f]->r_con.snd[i].pQueue.queueSize(true) > 0) - { - Package *frontPackage = rg->sMap[f]->r_con.snd[i].pQueue.getFront(true); - if(frontPackage->served && !frontPackage->completed) //!latest receive request has NOT been completed - { - bool flag = false; - int ret_flag; - MPI_Status status; - ParallelDescriptor::Test(frontPackage->request, ret_flag, status); - flag = (ret_flag == 0) ? false : true;//parallel_test_one(frontPackage%ptr%request) -------??????? 
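// ParallelDescriptor::Test is a thin wrapper over MPI_Test: ret_flag comes
// back nonzero exactly when the nonblocking operation has completed, i.e.
//     MPI_Test(&frontPackage->request, &ret_flag, &status);
// Only a completed *front* package is dequeued and recycled below, which
// keeps the send queue strictly FIFO.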
- if(flag) - { - omp_set_lock(rg->sMap[f]->r_con.sndLock); - frontPackage = rg->sMap[f]->r_con.snd[i].pQueue.dequeue(true); - frontPackage->completed = false; - frontPackage->served = false; - frontPackage->request = MPI_REQUEST_NULL; - frontPackage->notified = false; - rg->sMap[f]->r_con.snd[i].recycleQueue.enqueue(frontPackage,true); - omp_unset_lock(rg->sMap[f]->r_con.sndLock); -#pragma omp flush - omp_set_lock(rg->lMap[f]->r_con.sndLock); - frontPackage = rg->lMap[f]->r_con.snd[i].pQueue.dequeue(true); - frontPackage->completed = false; - frontPackage->served = false; - frontPackage->request = MPI_REQUEST_NULL; - rg->lMap[f]->r_con.snd[i].recycleQueue.enqueue(frontPackage,true); - omp_unset_lock(rg->lMap[f]->r_con.sndLock); - } - } - } // if(queueSize > 0) - } // for(itotalFinishes < perilla::NUM_THREAD_TEAMS) - { - serviceLocalRequests(graph, tg); - if((np>1) & (tg==0)) - serviceRemoteRequests(graph); - } - else - { - if(tg==0) - { - while(graph->totalFinishes < perilla::NUM_THREAD_TEAMS) - { -#pragma omp flush (graph) - } - //call parallel_barrier() ---???????? - ParallelDescriptor::Barrier("serviceSingleGraph-1"); - graph->graphTeardown(); - graph->workerTeardown(); - //call parallel_barrier() ------????????? - ParallelDescriptor::Barrier("serviceSingleGraph-2"); - } - break; - } - } // while(true) - -} //serviceSingleGraphComm - -void Perilla::serviceMultipleGraphComm(RegionGraph graphArray[], int nGraphs, bool cpyAcross, int tid) -{ - int tg = WorkerThread::perilla_wid(); - int np = ParallelDescriptor::NProcs(); - int graphFinishCnt = 0; - while(true) - { - for(int g=0; g 1) - if(tg==0) - { - serviceRemoteRequests(&graphArray[g],g,nGraphs); - //if(cpyAcross) - //serviceRemoteGridCopyRequests(graphArray,g,nGraphs,tg); - } - } - } - //!check if we have finished all the graph execution - bool noMoreWork = true; - for(int g=0; g > graphArrayHierarchy, std::vector &graphArray){ - int gCnt=0; - for(int l=0; l graphArray, bool cpyAcross, int tid) -{ - int tg = WorkerThread::perilla_wid(); - int np = ParallelDescriptor::NProcs(); - int myProc = ParallelDescriptor::MyProc(); - int graphFinishCnt = 0; - int nGraphs; - bool doublechecked = false; - - double maxltime=0; - double minltime=10; - double avgltime=0; - double numloops=0; - double ltime,lstime,letime; - - - //while(true) - { - //lstime = omp_get_wtime(); - for(int g=0; ggraphID==13) - //std::cout<<"Processing Local GridCopy Req Graph "<< g+1 << " tg " << tg <totalFinishes < perilla::NUM_THREAD_TEAMS) - { - /*try{ - if(graphArray[g]->assocMF == 0) - std::cout<<"Processing Graph with NULL MF "<graphID==1) - //std::cout<<"Processing Local Req Graph "<graphID==13) - //std::cout<<"Processing Local GridCopy Req Graph "<< g+1 << " tg " << tg < 1) - //if(tg==0) - { - serviceRemoteRequests(graphArray[g],g,nGraphs); - if(cpyAcross) - { - //resetRemoteGridCopyRequests(graphArray,g,nGraphs,tg); - if(tg==0) - serviceRemoteGridCopyRequests(graphArray,g,nGraphs,tg); - } - } - } - } - /* - //!check if we have finished all the graph execution - bool noMoreWork = true; - //std::cout<<"Graph Not Completed "; - for(int g=0; gtotalFinishes < perilla::NUM_THREAD_TEAMS) - { - noMoreWork = false; - //if(tg==0) - //std::cout<< g << " tfs " << graphArray[g]->totalFinishes << std::endl; - } - //else - // std::cout<<"Graph Completed "<< g < ::max(), '\n' ); - - //for(int g=0; gtotalFinishes << " | "; - - - //f( Perilla::numTeamsFinished == perilla::NUM_THREAD_TEAMS) - //{ - // if(doublechecked) // double check if there are still something to send - // break; 
- // else - // doublechecked = true; - //} - - //std::cout<<"Teams Completed "<< Perilla::numTeamsFinished << " tid "<< tid << " myProc " << myProc < maxltime) - // maxltime = ltime; - - } // while(true) - - //if(myProc==0) - //std::cout<< std::endl << "COMM HANDLER TIMES tg" << tg << " avg " << avgltime/numloops << " min " << minltime << " max " << maxltime <graphTeardown(tg); - //graphArray[g]->workerTeardown(tg); - //ParallelDescriptor::Barrier("serviceMultipleGraph-2"); - //} - -} // serviceMultipleGraphCommDynamic - - -void Perilla::serviceMultipleGraphComm(RegionGraph graphArray[], int nGraphs, int tid) -{ - serviceMultipleGraphComm(graphArray,nGraphs,false,tid); -} // serviceMultipleGraphComm - -void Perilla::fillBoundaryPush(RegionGraph* graph, MultiFab* mf, int f) -{ - - int nComp = mf->nComp(); - int tg= WorkerThread::perilla_wid(); - int ntid = WorkerThread::perilla_wtid(); - - //if(graph->graphID == 1 && f == 1) - //std::cout << "fillBPush for gID 1 f 1 ntid "<< ntid <lMap[f]->l_con.sLock)); - graph->worker[tg]->barr->sync(perilla::NUM_THREADS_PER_TEAM-1); // Barrier to synchronize team threads - - if(perilla::PACKING_FINEGRAIN) - {} - else - { - for(int i=0; ilMap[f]->l_con.nscpy; i++) - if( (i%(perilla::NUM_THREADS_PER_TEAM-1)) == ntid) - { - - //if(graph->graphID == 1 && graph->lMap[f]->l_con.scpy[i].nd == 1) - //std::cout << "fillBPush for gID 1 nd 1 pQenQ f " << f << " i " << i <lMap[f]->l_con.scpy[i].recycleQueue.getFront(true); - mf->m_fabs_v[f]->copyToMem(graph->lMap[f]->l_con.scpy[i].sbx,0,nComp,sPackage->databuf); - - for(int d=0; dbufSize; d++) - if(sPackage->databuf[d] == 0) - { - //std::cout<< "in fbPush Sending 0 from f "<< f <databuf[d] != 0); - } - //if(graph->lMap[f]->l_con.scpy[i].sbx.smallEnd() == graph->lMap[f]->l_con.scpy[i].sbx.bigEnd()) - //if(graph->lMap[f]->l_con.scpy[i].sbx.smallEnd(0)==7 && graph->lMap[f]->l_con.scpy[i].sbx.smallEnd(1)==7 && graph->lMap[f]->l_con.scpy[i].sbx.smallEnd(2)==4) - // std::cout<< "Corner Push for f "<< f << " data0 " <databuf[0]<< " size " <bufSize << " se "<< graph->lMap[f]->l_con.scpy[i].sbx.smallEnd() <worker[tg]->barr->sync(perilla::NUM_THREADS_PER_TEAM-1); // Barrier to synchronize team threads - - if(ntid==0) - { - //if(graph->graphID == 1 && f == 1) - //std::cout << "fillBPush for gID 1 f 1 pQ enQ" <lMap[f]->l_con.nscpy; i++) - { - //if(graph->graphID == 1 && graph->lMap[f]->l_con.scpy[i].nd == 1) - //std::cout << "fillBPush for gID 1 nd 1 pQ enQ from f "<< f <lMap[f]->l_con.scpy[i].pQueue.enqueue( graph->lMap[f]->l_con.scpy[i].recycleQueue.dequeue(true),true ); - } - omp_unset_lock(&(graph->lMap[f]->l_con.sLock)); - } - graph->worker[tg]->barr->sync(perilla::NUM_THREADS_PER_TEAM-1); // Barrier to synchronize team threads - } // if(LAZY_PUSH) - else - - int np = ParallelDescriptor::NProcs(); - if (np==1) return; - - if(ntid==0) - omp_set_lock(graph->lMap[f]->r_con.sndLock); - graph->worker[tg]->barr->sync(perilla::NUM_THREADS_PER_TEAM-1); // Barrier to synchronize team threads - - for(int i=0; ilMap[f]->r_con.nsnd; i++) - if((i%(perilla::NUM_THREADS_PER_TEAM-1))==ntid) - { - //std::cout << "RQS " << graph->lMap[f]->r_con.snd[i].recycleQueue.queueSize() << std::endl; - - Package *sndPackage = graph->lMap[f]->r_con.snd[i].recycleQueue.dequeue(true); - mf->m_fabs_v[f]->copyToMem(graph->lMap[f]->r_con.snd[i].sbx,0,nComp,sndPackage->databuf); - sndPackage->notified = false; - graph->lMap[f]->r_con.snd[i].pQueue.enqueue( sndPackage,true ); - //!the local message handler will detect the change and notify the remote message 
handler =>read access - //!the remote message handler first modifies the front item of this queue, then it push this item back to the message pool - } - graph->worker[tg]->barr->sync(perilla::NUM_THREADS_PER_TEAM-1); // Barrier to synchronize team threads - if(ntid==0) - { - omp_unset_lock(graph->lMap[f]->r_con.sndLock); - omp_set_lock(graph->sMap[f]->r_con.sndLock); - for(int i=0; ilMap[f]->r_con.nsnd; i++) - graph->sMap[f]->r_con.snd[i].pQueue.enqueue( graph->sMap[f]->r_con.snd[i].recycleQueue.dequeue(true),true ); - omp_unset_lock(graph->sMap[f]->r_con.sndLock); - } - -} // fillBoundaryPush - -void Perilla::fillBoundaryPull(RegionGraph* graph, MultiFab* mf, int f) -{ - - int nComp = mf->nComp(); - int tg= WorkerThread::perilla_wid(); - int ntid = WorkerThread::perilla_wtid(); - - if(ntid==0) - omp_set_lock(&(graph->lMap[f]->l_con.dLock)); - graph->worker[tg]->barr->sync(perilla::NUM_THREADS_PER_TEAM-1); // Barrier to synchronize team threads - - if(perilla::LAZY_PUSH) - { } - else - { - if(perilla::UNPACKING_FINEGRAIN) - {} - else - { - for(int i=0; ilMap[f]->l_con.ndcpy; i++) - if( (i%(perilla::NUM_THREADS_PER_TEAM-1)) == ntid) - { - Package *dPackage = graph->lMap[f]->l_con.dcpy[i].pQueue.getFront(true); - - for(int d=0; dbufSize; d++) - if(dPackage->databuf[d] == 0) - { - //std::cout<< "in fbPull Reciving 0 for f "<< f <databuf[d] != 0); - } - /* - if(f==0) - //if(graph->lMap[f]->l_con.dcpy[i].dbx.smallEnd() == graph->lMap[f]->l_con.dcpy[i].dbx.bigEnd()) - //if(graph->lMap[f]->l_con.dcpy[i].dbx.smallEnd(0)==-1 && graph->lMap[f]->l_con.dcpy[i].dbx.smallEnd(1)==-1 && graph->lMap[f]->l_con.dcpy[i].dbx.smallEnd(2)==4) - std::cout<< "Corner Pull for f "<< f << " data0 " <databuf[0]<< " size " <bufSize <<" se " <lMap[f]->l_con.dcpy[i].dbx.smallEnd()<m_fabs_v[f]->copyFromMem(graph->lMap[f]->l_con.dcpy[i].dbx,0,nComp,dPackage->databuf); - } - } // if(UNPACKING_FINEGRAIN) - else - } // if(LAZY_PUSH) - else - - graph->worker[tg]->barr->sync(perilla::NUM_THREADS_PER_TEAM-1); // Barrier to synchronize team threads - - if(ntid==0) - { - for(int i=0; ilMap[f]->l_con.ndcpy; i++) - graph->lMap[f]->l_con.dcpy[i].recycleQueue.enqueue( graph->lMap[f]->l_con.dcpy[i].pQueue.dequeue(true),true ); - - graph->lMap[f]->l_con.firingRuleCnt = graph->lMap[f]->l_con.firingRuleCnt - graph->lMap[f]->l_con.ndcpy; - - graph->lMap[f]->l_con.scpyCnt = 0; - for(int i=0; ilMap[f]->l_con.ndcpy; i++) - if(graph->lMap[f]->l_con.dcpy[i].pQueue.queueSize(true) >= 1) - graph->lMap[f]->l_con.firingRuleCnt++; - omp_unset_lock(&(graph->lMap[f]->l_con.dLock)); - } - graph->worker[tg]->barr->sync(perilla::NUM_THREADS_PER_TEAM-1); // Barrier to synchronize team threads - - int np = ParallelDescriptor::NProcs(); - if (np==1) return; - - if(ntid==0) - { - omp_set_lock(graph->rMap[f]->r_con.rcvLock); - omp_set_lock(graph->lMap[f]->r_con.rcvLock); - } - graph->worker[tg]->barr->sync(perilla::NUM_THREADS_PER_TEAM-1); // Barrier to synchronize team threads - - for(int i=0; ilMap[f]->r_con.nrcv; i++) - if( (i%(perilla::NUM_THREADS_PER_TEAM-1)) == ntid) - { - Package *rcvMetaPackage = graph->rMap[f]->r_con.rcv[i].pQueue.dequeue(true); - rcvMetaPackage->completed = false; - rcvMetaPackage->served = false; - rcvMetaPackage->request = MPI_REQUEST_NULL; - graph->rMap[f]->r_con.rcv[i].recycleQueue.enqueue(rcvMetaPackage,true); - Package *rcvPackage = graph->lMap[f]->r_con.rcv[i].pQueue.dequeue(true); - mf->m_fabs_v[f]->copyFromMem(graph->lMap[f]->r_con.rcv[i].dbx,0,nComp,rcvPackage->databuf); - rcvPackage->completed = false; - 
rcvPackage->notified = false; - graph->lMap[f]->r_con.rcv[i].recycleQueue.enqueue(rcvPackage,true); - } - graph->worker[tg]->barr->sync(perilla::NUM_THREADS_PER_TEAM-1); // Barrier to synchronize team threads - - if(ntid==0) - { - graph->lMap[f]->r_con.firingRuleCnt = graph->lMap[f]->r_con.firingRuleCnt - graph->lMap[f]->r_con.nrcv; - for(int i=0; ilMap[f]->r_con.nrcv; i++) - if(graph->lMap[f]->r_con.rcv[i].pQueue.queueSize(true) >= 1) - if(graph->lMap[f]->r_con.rcv[i].pQueue.getFront(true)->checkRequest()) - graph->lMap[f]->r_con.firingRuleCnt++; - omp_unset_lock(graph->lMap[f]->r_con.rcvLock); - omp_unset_lock(graph->rMap[f]->r_con.rcvLock); - } - -} // fillBoundaryPull - -void Perilla::fillBoundaryPull(RegionGraph* graph, MultiFab* mf, int f, bool singleT) -{ -exit(0); -} - -///////////////////////////////////////////////////////////////////////////////////////////////////////////////// - -void Perilla::multifabExtractCopyAssoc(RegionGraph* gDst, RegionGraph* gSrc, const MultiFab& mfDst, const MultiFab& mfSrc, int nc, int ng, int ngSrc, const Periodicity& period) -{ - // MultiFab* mfSrc = gSrc->assocMF; - // MultiFab* mfDst = gDst->assocMF; - int myProc = ParallelDescriptor::MyProc(); - int np = ParallelDescriptor::NProcs(); - - try{ - - if(true)//if(!(*mfSrc == *mfDst)) - { - if(ng > mfDst.nGrow()) cout <<"MULTIFAB_COPY_C: ng > mfDst.nGrow not supported in parallel copy"<< endl; - if(ngSrc > mfSrc.nGrow()) cout <<"MULTIFAB_COPY_C: ngSrc > mfSrc.nGrow"<< endl; - if(ngSrc > 0) - { - - // To be implemented - //do i = 1, nboxes(msrc%la) - // call push_back(bl, grow(box_nodalize(get_box(msrc%la,i),msrc%nodal),lngsrc)) - //end do - //call build(batmp, bl, sort = .false.) - //call destroy(bl) - //call build(lasrctmp, batmp, boxarray_bbox(batmp), explicit_mapping = get_proc(msrc%la)) - //call destroy(batmp) - //call build(msrctmp, lasrctmp, nc = lnc, ng = 0) - //pmfsrc => msrctmp - } - if(np > 1) - { - if(gSrc->sCopyMapHead == 0) - gSrc->sCopyMapHead = new CopyMap(); - else - { - CopyMap *tmpCopyMap = new CopyMap(); - tmpCopyMap->next = gSrc->sCopyMapHead; - gSrc->sCopyMapHead = tmpCopyMap; - } - if(gDst->rCopyMapHead == 0) - gDst->rCopyMapHead = new CopyMap(); - else - { - CopyMap *tmpCopyMap = new CopyMap(); - tmpCopyMap->next = gDst->rCopyMapHead; - gDst->rCopyMapHead = tmpCopyMap; - } - //gSrc->sCopyMapHead->map.reserve(mfSrc.size()); - //gDst->rCopyMapHead->map.reserve(mfDst.size()); - gSrc->sCopyMapHead->alloc_CopyMap(mfSrc); - gDst->rCopyMapHead->alloc_CopyMap(mfDst); - } - - if(gSrc->numTasks != mfSrc.IndexArray().size()) - std::cout<< "before " <numTasks << " now " <graphID << std::endl; - - gSrc->numFabs = mfSrc.size(); - gDst->numFabs = mfDst.size(); - - gSrc->numTasks = mfSrc.IndexArray().size(); - gDst->numTasks = mfDst.IndexArray().size(); - - int nfabsSrc = mfSrc.IndexArray().size(); - int nfabsDst = mfDst.IndexArray().size(); - - const FabArrayBase::CPC& TheCPC = mfDst.getCPC(IntVect(ng), mfSrc, IntVect(ngSrc), period); - - const int nloc_cpAsc = TheCPC.m_LocTags->size(); - const int nsnds_cpAsc = TheCPC.m_SndTags->size(); - const int nrcvs_cpAsc = TheCPC.m_RcvTags->size(); - - Vector send_cctc; - Vector send_pr; - send_cctc.reserve(nsnds_cpAsc); - - for (FabArrayBase::MapOfCopyComTagContainers::const_iterator m_it = TheCPC.m_SndTags->begin(), - m_End = TheCPC.m_SndTags->end(); - m_it != m_End; - ++m_it) - { - if(m_it->first != myProc) // Not destined to me. 
- { - send_pr.push_back(m_it->first); - send_cctc.push_back(&(m_it->second)); - } - } - - // std::cout<< "Loop 1" < recv_cctc; - Vector recv_pr; - recv_cctc.reserve(nrcvs_cpAsc); - - for (FabArrayBase::MapOfCopyComTagContainers::const_iterator m_it = TheCPC.m_RcvTags->begin(), - m_End = TheCPC.m_RcvTags->end(); - m_it != m_End; - ++m_it) - { - if(m_it->first != myProc) // I am not the source for this receipt - { - recv_pr.push_back(m_it->first); - recv_cctc.push_back(&(m_it->second)); - } - } - - //std::cout<< "Before parallel at gID " << gDst->graphID << " numTask " << gDst->numTasks << " numFabs " << gDst->numFabs <graphID > 25) - //std::cout<< "Inside parallel Generating Send at tid " << tid << " f " << f << " gID " << gDst->graphID <task[f]->cpAsc_srcHead == 0) - { - gSrc->task[f]->cpAsc_srcHead = new FabCopyAssoc(); - cpSrc = gSrc->task[f]->cpAsc_srcHead; - } - else - { - cpSrc = new FabCopyAssoc(); - cpSrc->next = gSrc->task[f]->cpAsc_srcHead; - gSrc->task[f]->cpAsc_srcHead = cpSrc; - } - - cpSrc->graphPartner = gDst; - cpSrc->l_con.nscpy = 0; - for(int i=0; il_con.nscpy++; - } - cpSrc->l_con.scpy = new LocalCopyDescriptor[cpSrc->l_con.nscpy]; - int scnt = 0; - - //if(gDst->graphID == 4 && tag.dstIndex == 60 ) - //std::cout<< "Inside parallel Generating Local Copy send at tid " << tid << " f " << f << " gID " << gDst->graphID <graphID == 4 && (tag.dstIndex == 60 || tag.dstIndex == 59) ) - //std::cout <<"myP " <l_con.scpy[scnt].ns = mfSrc.localindex(tag.srcIndex); - cpSrc->l_con.scpy[scnt].nd = mfDst.localindex(tag.dstIndex); - cpSrc->l_con.scpy[scnt].sbx = tag.sbox; - cpSrc->l_con.scpy[scnt].dbx = tag.dbox; - int psize = tag.sbox.numPts() * mfSrc.nComp(); //---------------------------------------------------------------???????????????? - //std::cout<< " gSrc ID "<< gSrc->graphID << " f "<databuf[j] = 0; - cpSrc->l_con.scpy[scnt].pQueue.enqueue(tmpPkg); - } - for(int p=0; pl_con.scpy[scnt].recycleQueue.enqueue(cpSrc->l_con.scpy[scnt].pQueue.dequeue()); - scnt++; - } - } - - if(np > 1) - { - cpSrc->r_con.nsnd = 0; - cpSrc->r_con.remotePushReady = false; - cpSrc->r_con.firingRuleCnt = 0; - for(int i=0; isrcIndex) - cpSrc->r_con.nsnd++; - } - } // for(ir_con.snd = new RemoteCommDescriptor[cpSrc->r_con.nsnd]; - scnt = 0; - for(int i=0; isrcIndex) - { - - //if(gDst->graphID == 17 && (it->srcIndex == 1198 || it->srcIndex == 1198 || it->srcIndex == 978 || it->srcIndex == 978)) - //std::cout <<"myP " <dstIndex << " s "<< it->srcIndex << " f " << f << " i "<< scnt << " tg " <r_con.snd[scnt].ns = it->srcIndex; - cpSrc->r_con.snd[scnt].nd = it->dstIndex; - cpSrc->r_con.snd[scnt].lns = mfSrc.localindex(it->srcIndex); - cpSrc->r_con.snd[scnt].lnd = mfDst.localindex(it->dstIndex); - cpSrc->r_con.snd[scnt].sbx = it->sbox; - cpSrc->r_con.snd[scnt].dbx = it->dbox; - int psize = it->sbox.numPts() * mfSrc.nComp(); //---------------------------------------------------------------???????????????? 
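// Every descriptor array in this function is built in two passes: pass 1
// counts the CopyComTags addressed to fab f so a plain array can be sized,
// pass 2 fills it in.  A std::vector would collapse the passes into one,
//     std::vector<RemoteCommDescriptor> snd;
//     for (auto const& tag : *send_cctc[i])
//         if (mfSrc.IndexArray()[f] == tag.srcIndex) snd.push_back(...);
// at the price of reallocation inside the OpenMP parallel region, which
// the counted arrays avoid (a guess at the motive, not stated in the code).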
- - for(int p=0; pdatabuf[j] = 0; - cpSrc->r_con.snd[scnt].pQueue.enqueue(tmpPkg); - } - for(int p=0; pr_con.snd[scnt].recycleQueue.enqueue(cpSrc->r_con.snd[scnt].pQueue.dequeue()); - scnt++; - } - } - } // for(i 1) - } // if(fg==tg) -#pragma omp barrier - // std::cout<< "Barrier 1" < 1) - { - if(WorkerThread::perilla_isMasterWorkerThread() && tg==0) - { - - // std::cout<< "Inside parallel Generating Remote Send tg 0 at tid " << tid << " f " << f << " gID " << gDst->graphID <sCopyMapHead->map[f]->r_con.nsnd = 0; - gSrc->sCopyMapHead->map[f]->r_con.firingRuleCnt = 0; - for(int i=0; isrcIndex) - gSrc->sCopyMapHead->map[f]->r_con.nsnd++; - } - } // for(isCopyMapHead->map[f]->r_con.snd = new RemoteCommDescriptor[gSrc->sCopyMapHead->map[f]->r_con.nsnd]; - int scnt = 0; - for(int i=0; isrcIndex) - { - - //if(gDst->graphID == 31 && (it->dstIndex == 519)) - //std::cout <<"myP " <dstIndex << " ns "<< it->srcIndex << " f " << f << " i "<< scnt << " tg " <sCopyMapHead->map[f]->r_con.snd[scnt].ns = it->srcIndex; - gSrc->sCopyMapHead->map[f]->r_con.snd[scnt].nd = it->dstIndex; - gSrc->sCopyMapHead->map[f]->r_con.snd[scnt].r_gid = gDst->graphID-1; - gSrc->sCopyMapHead->map[f]->r_con.snd[scnt].r_grids = (gDst->numFabs > gSrc->numFabs ? gDst->numFabs : gSrc->numFabs); - gSrc->sCopyMapHead->map[f]->r_con.snd[scnt].lns = mfSrc.localindex(it->srcIndex); - gSrc->sCopyMapHead->map[f]->r_con.snd[scnt].lnd = mfDst.localindex(it->dstIndex); - gSrc->sCopyMapHead->map[f]->r_con.snd[scnt].sbx = it->sbox; - gSrc->sCopyMapHead->map[f]->r_con.snd[scnt].dbx = it->dbox; - - int psize = it->sbox.numPts() * mfSrc.nComp(); //---------------------------------------------------------------???????????????? - - gSrc->sCopyMapHead->map[f]->r_con.snd[scnt].sz = psize; - gSrc->sCopyMapHead->map[f]->r_con.snd[scnt].pr = send_pr[i]; - - for(int p=0; pdatabuf[j] = 0; - gSrc->sCopyMapHead->map[f]->r_con.snd[scnt].pQueue.enqueue(tmpPkg); - } - for(int p=0; psCopyMapHead->map[f]->r_con.snd[scnt].recycleQueue.enqueue(gSrc->sCopyMapHead->map[f]->r_con.snd[scnt].pQueue.dequeue()); - scnt++; - } - } - } // for(i 1) - } // for(fgraphID > 25) - //std::cout<< "Inside parallel Generating Recive at tid " << tid << " f " << f << " gID " << gDst->graphID <task[f]->cpAsc_dstHead == 0) - { - gDst->task[f]->cpAsc_dstHead = new FabCopyAssoc(); - cpDst = gDst->task[f]->cpAsc_dstHead; - } - else - { - cpDst = new FabCopyAssoc(); - cpDst->next = gDst->task[f]->cpAsc_dstHead; - gDst->task[f]->cpAsc_dstHead = cpDst; - } - cpDst->graphPartner = gSrc; - cpDst->l_con.ndcpy = 0; - cpDst->l_con.firingRuleCnt = 0; - cpDst->l_con.dcpyCnt = 0; - for(int i=0; il_con.ndcpy++; - } - cpDst->l_con.dcpy = new LocalCopyDescriptor[cpDst->l_con.ndcpy]; - int dcnt = 0; - - //if(gDst->graphID > 25) - //std::cout<< "Inside parallel Generating Local copy recive at tid " << tid << " f " << f << " gID " << gDst->graphID <graphID ==27 && f == 633) - //std::cout<< "tid " << tid << " f " << f << " gID " << gDst->graphID << " numReciv " << nloc_cpAsc << " ndcpy " << cpDst->l_con.ndcpy <graphID == 4 && (tag.dstIndex == 60 || tag.dstIndex == 59)) - //std::cout<< "dcpy tid " << tid << " f " << f << " i " << i << " dcnt " << dcnt << " ns "<l_con.dcpy[dcnt].ns = mfSrc.localindex(tag.srcIndex); - cpDst->l_con.dcpy[dcnt].nd = mfDst.localindex(tag.dstIndex); - cpDst->l_con.dcpy[dcnt].sbx = tag.sbox; - cpDst->l_con.dcpy[dcnt].dbx = tag.dbox; - - // if(gDst->graphID > 25 && f == 633) - //std::cout<< " Generating Package tid " << tid << " i " << i <l_con.dcpy[dcnt].sz = psize; - - 
if(!gDst->isDepGraph) - { - for(int p=0; pdatabuf[j] = 0; - cpDst->l_con.dcpy[dcnt].pQueue.enqueue(tmpPkg); - } - - // if(gDst->graphID > 25 && f == 633) - //std::cout<< " Generating now in reQ Package tid " << tid << " i " << i <l_con.dcpy[dcnt].recycleQueue.enqueue(cpDst->l_con.dcpy[dcnt].pQueue.dequeue()); - - //if(gDst->graphID > 25 && f == 633) - // std::cout<< " Generated Package tid " << tid << " i " << i <graphID > 25 && f > 630) - //std::cout<< "Safe now tid " << tid << " f " << f << " gID " << gDst->graphID << " numReciv " << nloc_cpAsc <srcLinkGraph; - for(int df=0; df < gDst->task[f]->depTaskIDs.size(); df++) - { - int dfi = gDst->task[f]->depTaskIDs[df]; - FabCopyAssoc *cpdDst = depGraph->task[dfi]->cpAsc_dstHead; - for(int i=0; il_con.ndcpy ; i++) - { - for(int p=0; pl_con.dcpy[i].sz; - Package *tmpPkg = new Package(psize); - for(int j=0; jdatabuf[j] = 0; - cpdDst->l_con.dcpy[i].pQueue.enqueue(tmpPkg); - } - for(int p=0; pl_con.dcpy[i].recycleQueue.enqueue(cpdDst->l_con.dcpy[i].pQueue.dequeue()); - } - } - - if(np > 1) - { - cpDst->r_con.nrcv = 0; - cpDst->r_con.remotePullDone = false; - cpDst->r_con.firingRuleCnt = 0; - for(int i=0; idstIndex) - cpDst->r_con.nrcv++; - } - } // for(ir_con.rcv = new RemoteCommDescriptor[cpDst->r_con.nrcv]; - dcnt = 0; - for(int i=0; idstIndex) - if(mfDst.IndexArray()[f] == it->dstIndex) - { - cpDst->r_con.rcv[dcnt].nd = it->dstIndex; - cpDst->r_con.rcv[dcnt].ns = it->srcIndex; - cpDst->r_con.rcv[dcnt].lnd = mfDst.localindex(it->dstIndex); - cpDst->r_con.rcv[dcnt].lns = mfSrc.localindex(it->srcIndex); - cpDst->r_con.rcv[dcnt].sbx = it->sbox; - cpDst->r_con.rcv[dcnt].dbx = it->dbox; - int psize = it->dbox.numPts() * mfDst.nComp(); //---------------------------------------------------------------???????????????? 
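// Sizing note: send-side packages above use the source box
// (sbox.numPts() * nComp), receive-side packages here use the destination
// box (dbox.numPts() * nComp).  The two boxes of one copy tag cover the
// same number of points, so the matched send and receive agree on length.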
- cpDst->r_con.rcv[dcnt].sz = psize; - - if(!gDst->isDepGraph) - { - for(int p=0; pdatabuf[j] = 0; - cpDst->r_con.rcv[dcnt].pQueue.enqueue(tmpPkg); - } - for(int p=0; pr_con.rcv[dcnt].recycleQueue.enqueue(cpDst->r_con.rcv[dcnt].pQueue.dequeue()); - } - - dcnt++; - } - } - }// for(isrcLinkGraph; - for(int df=0; df < gDst->task[f]->depTaskIDs.size(); df++) - { - int dfi = gDst->task[f]->depTaskIDs[df]; - FabCopyAssoc *cpdDst = depGraph->task[dfi]->cpAsc_dstHead; - for(int i=0; ir_con.nrcv ; i++) - { - for(int p=0; pr_con.rcv[i].sz; - Package *tmpPkg = new Package(psize); - for(int j=0; jdatabuf[j] = 0; - cpdDst->r_con.rcv[i].pQueue.enqueue(tmpPkg); - } - for(int p=0; pr_con.rcv[i].recycleQueue.enqueue(cpdDst->r_con.rcv[i].pQueue.dequeue()); - } - } - - - } // if(np > 1) - }// if(fg==tg) - -#pragma omp barrier - if(np > 1) - { - //if(tid==0) - if(WorkerThread::perilla_isMasterWorkerThread() && tg==0) - { - - // std::cout<< "Inside parallel Generating Remote Recive tg 0 at tid " << tid << " f " << f << " gID " << gDst->graphID <rCopyMapHead->map[f]->r_con.nrcv = 0; - gDst->rCopyMapHead->map[f]->r_con.firingRuleCnt = 0; - for(int i=0; idstIndex) - if(mfDst.IndexArray()[f] == it->dstIndex) - gDst->rCopyMapHead->map[f]->r_con.nrcv++; - } - } - gDst->rCopyMapHead->map[f]->r_con.rcv = new RemoteCommDescriptor[gDst->rCopyMapHead->map[f]->r_con.nrcv]; - int dcnt = 0; - for(int i=0; idstIndex) - if(mfDst.IndexArray()[f] == it->dstIndex) - { - - // if(myProc==54 && gDst->graphID == 25 && f == 10) - // std::cout <<"myP " <dstIndex << " ns "<< it->srcIndex << " f " << f << " sgID "<< gSrc->graphID <<" tg "<rCopyMapHead->map[f]->r_con.rcv[dcnt].nd = it->dstIndex; - gDst->rCopyMapHead->map[f]->r_con.rcv[dcnt].ns = it->srcIndex; - gDst->rCopyMapHead->map[f]->r_con.rcv[dcnt].lnd = mfDst.localindex(it->dstIndex); - gDst->rCopyMapHead->map[f]->r_con.rcv[dcnt].lns = mfSrc.localindex(it->srcIndex); - gDst->rCopyMapHead->map[f]->r_con.rcv[dcnt].r_grids = (gDst->numFabs > gSrc->numFabs ? gDst->numFabs : gSrc->numFabs); - gDst->rCopyMapHead->map[f]->r_con.rcv[dcnt].sbx = it->sbox; - gDst->rCopyMapHead->map[f]->r_con.rcv[dcnt].dbx = it->dbox; - - int psize = it->dbox.numPts() * mfDst.nComp(); //---------------------------------------------------------------???????????????? 
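// The genTags block below mints one unique MPI tag per (receiving rank,
// graph, dstIndex, srcIndex, message size) tuple, find-or-insert style.
// Since std::map's operator[] value-initializes missing ints to 0, the
// explicit find/else bookkeeping is equivalent to the shorter:
//     auto& bySize = tagMap[recv_pr[i]][gDst->graphID-1][it->dstIndex][it->srcIndex];
//     if (bySize.count(psize) == 0) {
//         bySize[psize] = Perilla::uTags++;
//         pTagCnt[recv_pr[i]][gDst->graphID-1]++;
//     }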
- - gDst->rCopyMapHead->map[f]->r_con.rcv[dcnt].sz = psize; - gDst->rCopyMapHead->map[f]->r_con.rcv[dcnt].pr = recv_pr[i]; - - BL_ASSERT(gDst->rCopyMapHead->map[f]->r_con.rcv[dcnt].lnd == f); - - if(Perilla::genTags) - { - try{ - std::map::iterator itr = tagMap[recv_pr[i]][gDst->graphID-1][it->dstIndex][it->srcIndex].find(psize); - if( itr != tagMap[recv_pr[i]][gDst->graphID-1][it->dstIndex][it->srcIndex].end()) - { - //gDst->rCopyMapHead->map[f]->r_con.rcv[dcnt].lnd = itr->second; - } - else - { - tagMap[recv_pr[i]][gDst->graphID-1][it->dstIndex][it->srcIndex][psize] = Perilla::uTags++; - //gDst->rCopyMapHead->map[f]->r_con.rcv[dcnt].lnd = Perilla::uTags++; - std::map::iterator itr2 = pTagCnt[recv_pr[i]].find(gDst->graphID-1); - if(itr2 != pTagCnt[recv_pr[i]].end()) - pTagCnt[recv_pr[i]][gDst->graphID-1] = pTagCnt[recv_pr[i]][gDst->graphID-1] + 1; - else - pTagCnt[recv_pr[i]][gDst->graphID-1] = 1; - } - } - catch(std::exception& e) - { - std::cout <<"Inside tagGeneration gID "<< gDst->graphID <<" "<< e.what() << '\n'; - } - } - //tagMap[recv_pr[i]][gDst->graphID][it->dstIndex][it->srcIndex] = pTagCnt[recv_pr[i]]; - - - for(int p=0; pdatabuf[j] = 0; - gDst->rCopyMapHead->map[f]->r_con.rcv[dcnt].pQueue.enqueue(tmpPkg); - } - for(int p=0; prCopyMapHead->map[f]->r_con.rcv[dcnt].recycleQueue.enqueue(gDst->rCopyMapHead->map[f]->r_con.rcv[dcnt].pQueue.dequeue()); - dcnt++; - } - } - } // for(i 1) - //} //if(fg==tg) - } // for(fgraphID > 25) - //std::cout<< "Inside parallel Generating Send partners at tid " << tid << " f " << f << " gID " << gDst->graphID <task[f]->cpAsc_srcHead->l_con.nscpy; i++) - { - int lnd = gSrc->task[f]->cpAsc_srcHead->l_con.scpy[i].nd; - for(int j=0; jtask[ lnd ]->cpAsc_dstHead->l_con.ndcpy; j++) - if(gSrc->task[f]->cpAsc_srcHead->l_con.scpy[i].dbx == gDst->task[ lnd ]->cpAsc_dstHead->l_con.dcpy[j].dbx) - gSrc->task[f]->cpAsc_srcHead->l_con.scpy[i].dPartner = j; - } - } - } // for(fgraphID > 25) - //std::cout<< "Inside parallel Generating Recive partners at tid " << tid << " f " << f << " gID " << gDst->graphID <task[f]->cpAsc_dstHead->l_con.ndcpy; i++) - { - int lns = gDst->task[f]->cpAsc_dstHead->l_con.dcpy[i].ns; - for(int j=0; jtask[ lns ]->cpAsc_srcHead->l_con.nscpy; j++) - if(gDst->task[f]->cpAsc_dstHead->l_con.dcpy[i].dbx == gSrc->task[ lns ]->cpAsc_srcHead->l_con.scpy[j].dbx) - gDst->task[f]->cpAsc_dstHead->l_con.dcpy[i].sPartner = j; - } - } - } // for(fgraphID <<" "<< e.what() << '\n'; -} - - -//std::cout<< "All done safely at gID " << gDst->graphID <assocMF; - // MultiFab* mfSrc = srcGraph->assocMF; - if(nc<1) cout <<"MULTIFAB_COPY_C: nc must be >= 1"<< endl; - if(mfDst->nComp() < (dstcomp-1)) cout <<"MULTIFAB_COPY_C: nc too large for dst multifab"<< endl; - if(mfSrc->nComp() < (srccomp-1)) cout <<"MULTIFAB_COPY_C: nc too large for src multifab"<< endl; - - if(true)//if(!(*mfDst == *mfSrc)) - { - if(ng > mfDst->nGrow()) cout <<"MULTIFAB_COPY_C: ng > 0 not supported in parallel copy"<< endl; - if(ngsrc > mfSrc->nGrow()) cout <<"MULTIFAB_COPY_C: ngsrc > msrc%ng"<< endl; - FabCopyAssoc* cpSrc = srcGraph->task[f]->cpAsc_srcHead; - - //if(srcGraph->graphID==18 && f ==316 && ntid == 0) - //std::cout << "srgG chk see " << srcGraph << " " <graphPartner == destGraph) - break; - cpSrc = cpSrc->next; - } - if(cpSrc == 0) cout <<"Metadata for across grid copy not found"<< endl; - - if(singleT) - { - omp_set_lock(&(cpSrc->l_con.sLock)); - for(int i=0; il_con.nscpy; i++) - { - Package* sndPackage = cpSrc->l_con.scpy[i].recycleQueue.getFront(true); - 
mfSrc->m_fabs_v[f]->copyToMem(cpSrc->l_con.scpy[i].sbx,srccomp,nc,sndPackage->databuf); - } - for(int i=0;il_con.nscpy; i++) - cpSrc->l_con.scpy[i].pQueue.enqueue(cpSrc->l_con.scpy[i].recycleQueue.dequeue(true),true); - omp_unset_lock(&(cpSrc->l_con.sLock)); - } - else - { - if(ntid == 0) - omp_set_lock(&(cpSrc->l_con.sLock)); - srcGraph->worker[tg]->barr->sync(perilla::NUM_THREADS_PER_TEAM-1); - for(int i=0; il_con.nscpy; i++) - if((i%(perilla::NUM_THREADS_PER_TEAM-1)) == ntid) - { - Package* sndPackage = cpSrc->l_con.scpy[i].recycleQueue.getFront(true); - mfSrc->m_fabs_v[f]->copyToMem(cpSrc->l_con.scpy[i].sbx,srccomp,nc,sndPackage->databuf); - } - srcGraph->worker[tg]->barr->sync(perilla::NUM_THREADS_PER_TEAM-1); - if(ntid==0) - { - for(int i=0;il_con.nscpy; i++) - cpSrc->l_con.scpy[i].pQueue.enqueue(cpSrc->l_con.scpy[i].recycleQueue.dequeue(true),true); - omp_unset_lock(&(cpSrc->l_con.sLock)); - } - srcGraph->worker[tg]->barr->sync(perilla::NUM_THREADS_PER_TEAM-1); - } - - int np = ParallelDescriptor::NProcs(); - if(np == 1) - return; - - //if(myProc==26 && srcGraph->graphID==18 && ntid == 0) - //std::cout << "Notw its sgID 18,"<< f <<" turn lets see " << cpSrc->r_con.nsnd <graphID==18 && ntid == 0) - //std::cout << "Notw its sgID 18,"<< f <<" turn lets see " << cpSrc->r_con.nsnd <graphID==18 && f ==316) - //BL_ASSERT(cpSrc->r_con.nsnd == 177); - - if(singleT) - { - omp_set_lock(cpSrc->r_con.sndLock); - for(int i=0; ir_con.nsnd; i++) - { - - Package* sndPackage = cpSrc->r_con.snd[i].recycleQueue.dequeue(true); - mfSrc->m_fabs_v[f]->copyToMem(cpSrc->r_con.snd[i].sbx,srccomp,nc,sndPackage->databuf); - sndPackage->notified = false; - sndPackage->notified = false; - cpSrc->r_con.snd[i].pQueue.enqueue(sndPackage,true); - } - - omp_unset_lock(cpSrc->r_con.sndLock); - - cpSrc->r_con.remotePushReady = true; - ///* - omp_set_lock(srcGraph->sCopyMapHead->map[f]->r_con.sndLock); - for(int i=0; ir_con.nsnd; i++) - srcGraph->sCopyMapHead->map[f]->r_con.snd[i].pQueue.enqueue(srcGraph->sCopyMapHead->map[f]->r_con.snd[i].recycleQueue.dequeue(true),true); - omp_unset_lock(srcGraph->sCopyMapHead->map[f]->r_con.sndLock); - } - else - { - if(ntid == 0) - omp_set_lock(cpSrc->r_con.sndLock); - srcGraph->worker[tg]->barr->sync(perilla::NUM_THREADS_PER_TEAM-1); - - for(int i=0; ir_con.nsnd; i++) - if((i%(perilla::NUM_THREADS_PER_TEAM-1)) == ntid) - { - - // if(myProc==4 && srcGraph->graphID==2 && (f ==0 || f ==2)) - //std::cout << " Pushing 2 316 164"<r_con.snd[i].recycleQueue.dequeue(true); - mfSrc->m_fabs_v[f]->copyToMem(cpSrc->r_con.snd[i].sbx,srccomp,nc,sndPackage->databuf); - sndPackage->notified = false; - sndPackage->notified = false; - cpSrc->r_con.snd[i].pQueue.enqueue(sndPackage,true); - - } - - srcGraph->worker[tg]->barr->sync(perilla::NUM_THREADS_PER_TEAM-1); - if(ntid==0) - { - omp_unset_lock(cpSrc->r_con.sndLock); - - cpSrc->r_con.remotePushReady = true; - ///* - omp_set_lock(srcGraph->sCopyMapHead->map[f]->r_con.sndLock); - for(int i=0; ir_con.nsnd; i++) - srcGraph->sCopyMapHead->map[f]->r_con.snd[i].pQueue.enqueue(srcGraph->sCopyMapHead->map[f]->r_con.snd[i].recycleQueue.dequeue(true),true); - omp_unset_lock(srcGraph->sCopyMapHead->map[f]->r_con.sndLock); - //*/ - } - srcGraph->worker[tg]->barr->sync(perilla::NUM_THREADS_PER_TEAM-1); - } - } // if(!(*mfDst == *mfSrc)) -} // multifabCopyPushAsync - -void Perilla::multifabCopyPushAsync(RegionGraph* destGraph, RegionGraph* srcGraph, MultiFab* mfDst, MultiFab* mfSrc, int f, bool singleT) -{ - multifabCopyPushAsync(destGraph, srcGraph, mfDst, mfSrc, 
-
-void Perilla::multifabCopyPush(RegionGraph* destGraph, RegionGraph* srcGraph, amrex::MultiFab* mfDst, amrex::MultiFab* mfSrc, int f, int dstcomp, int srccomp, int nc, int ng, int ngsrc, bool singleT)
-{
-    if(nc<1) cout <<"MULTIFAB_COPY_C: nc must be >= 1"<< endl;
-    if(mfDst->nComp() < (dstcomp-1)) cout <<"MULTIFAB_COPY_C: nc too large for dst multifab"<< endl;
-    if(mfSrc->nComp() < (srccomp-1)) cout <<"MULTIFAB_COPY_C: nc too large for src multifab"<< endl;
-
-    multifabCopyPush_1Team(destGraph,srcGraph,mfDst,mfSrc,f,dstcomp,srccomp,nc,ng,ngsrc,singleT);
-    if(!singleT)
-        srcGraph->worker[perilla::wid()]->barr->sync(perilla::NUM_THREADS_PER_TEAM-perilla::NUM_COMM_THREADS);
-}
-
-void Perilla::multifabCopyPush_1Team(RegionGraph* destGraph, RegionGraph* srcGraph, amrex::MultiFab* mfDst, amrex::MultiFab* mfSrc, int f, int dstcomp, int srccomp, int nc, int ng, int ngsrc, bool singleT)
-{
-    int ntid = perilla::wtid();// - perilla::NUM_COMM_THREADS;
-    int tg = perilla::wid();
-    int myProc = amrex::ParallelDescriptor::MyProc();
-
-    if(true)//if(!(*mfDst == *mfSrc))
-    {
-    if(ng > mfDst->nGrow()) cout <<"MULTIFAB_COPY_C: ng > 0 not supported in parallel copy"<< endl;
-    if(ngsrc > mfSrc->nGrow()) cout <<"MULTIFAB_COPY_C: ngsrc > msrc%ng"<< endl;
-    FabCopyAssoc* cpSrc = srcGraph->task[f]->cpAsc_srcHead;
-
-    while(cpSrc != 0)
-    {
-        if(cpSrc->graphPartner == destGraph)
-            break;
-        cpSrc = cpSrc->next;
-    }
-    if(cpSrc == 0) cout <<"Metadata for across grid copy not found"<< endl;
-
-    if(singleT)
-    {
-        omp_set_lock(&(cpSrc->l_con.sLock));
-        for(int i=0; i<cpSrc->l_con.nscpy; i++)
-        {
-            Package* sndPackage = cpSrc->l_con.scpy[i].recycleQueue.getFront(true);
-            mfSrc->m_fabs_v[f]->copyToMem(cpSrc->l_con.scpy[i].sbx,srccomp,nc,sndPackage->databuf);
-        }
-        for(int i=0; i<cpSrc->l_con.nscpy; i++)
-            cpSrc->l_con.scpy[i].pQueue.enqueue(cpSrc->l_con.scpy[i].recycleQueue.dequeue(true));
-        omp_unset_lock(&(cpSrc->l_con.sLock));
-    }
-    else
-    {
-        if(ntid == 0)
-            omp_set_lock(&(cpSrc->l_con.sLock));
-        srcGraph->worker[tg]->barr->sync(perilla::NUM_THREADS_PER_TEAM-perilla::NUM_COMM_THREADS);
-
-        for(int i=0; i<cpSrc->l_con.nscpy; i++)
-            if((i%(perilla::NUM_THREADS_PER_TEAM-perilla::NUM_COMM_THREADS)) == ntid)
-            {
-                Package* sndPackage = cpSrc->l_con.scpy[i].recycleQueue.getFront(true);
-                mfSrc->m_fabs_v[f]->copyToMem(cpSrc->l_con.scpy[i].sbx,srccomp,nc,sndPackage->databuf);
-                /*
-                for(int ii=0; ii < sndPackage->bufSize; ii++)
-                    if(sndPackage->databuf[ii] == 0)
-                        fout << "MFCPush loc zero at " << f << " i " << i << " ii " << ii << " sbx "<< cpSrc->l_con.scpy[i].sbx << std::endl;
-                */
-            }
-
-        //fout.close();
-
-        srcGraph->worker[tg]->barr->sync(perilla::NUM_THREADS_PER_TEAM-perilla::NUM_COMM_THREADS);
-        if(ntid==0)
-        {
-            for(int i=0; i<cpSrc->l_con.nscpy; i++)
-                cpSrc->l_con.scpy[i].pQueue.enqueue(cpSrc->l_con.scpy[i].recycleQueue.dequeue(true));
-            omp_unset_lock(&(cpSrc->l_con.sLock));
-        }
-        srcGraph->worker[tg]->barr->sync(perilla::NUM_THREADS_PER_TEAM-perilla::NUM_COMM_THREADS);
-    }
-
-    int np = amrex::ParallelDescriptor::NProcs();
-    if(np == 1)
-        return;
-    if(singleT)
-    {
-        omp_set_lock((cpSrc->r_con.sndLock));
-        for(int i=0; i<cpSrc->r_con.nsnd; i++)
-        {
-            Package* sndPackage = cpSrc->r_con.snd[i].recycleQueue.dequeue(true);
-            mfSrc->m_fabs_v[f]->copyToMem(cpSrc->r_con.snd[i].sbx,srccomp,nc,sndPackage->databuf);
-            sndPackage->notified = false;
-            sndPackage->served = false;
-            sndPackage->completed = false;
-            cpSrc->r_con.snd[i].pQueue.enqueue(sndPackage, true);
-        }
-        cpSrc->r_con.remotePushReady = true;
-        omp_unset_lock((cpSrc->r_con.sndLock));
-    }
-    else
-    {
-        if(ntid == 0)
-        {
-            omp_set_lock((cpSrc->r_con.sndLock));
-        }
-        srcGraph->worker[tg]->barr->sync(perilla::NUM_THREADS_PER_TEAM-perilla::NUM_COMM_THREADS);
-
-        for(int i=0; i<cpSrc->r_con.nsnd; i++)
-            if((i%(perilla::NUM_THREADS_PER_TEAM-perilla::NUM_COMM_THREADS)) == ntid)
-            {
-                Package* sndPackage = cpSrc->r_con.snd[i].recycleQueue.dequeue(true);
-                mfSrc->m_fabs_v[f]->copyToMem(cpSrc->r_con.snd[i].sbx,srccomp,nc,sndPackage->databuf);
-                sndPackage->notified = false;
-                sndPackage->served = false;
-                sndPackage->completed = false;
-                cpSrc->r_con.snd[i].pQueue.enqueue(sndPackage, true);
-            }
-
-        //fout.close();
-        srcGraph->worker[tg]->barr->sync(perilla::NUM_THREADS_PER_TEAM-perilla::NUM_COMM_THREADS);
-        if(ntid==0)
-        {
-            cpSrc->r_con.remotePushReady = true;
-/*
-            for(int i=0; i<cpSrc->r_con.nsnd; i++){
-                Package* sndPackage = srcGraph->sCopyMapHead->map[f]->r_con.snd[i].recycleQueue.dequeue(true);
-                sndPackage->served = false;
-                sndPackage->completed = false;
-                srcGraph->sCopyMapHead->map[f]->r_con.snd[i].pQueue.enqueue(sndPackage, true);
-            }
-*/
-            omp_unset_lock((cpSrc->r_con.sndLock));
-        }
-        srcGraph->worker[tg]->barr->sync(perilla::NUM_THREADS_PER_TEAM-perilla::NUM_COMM_THREADS);
-    }
-    } // if(!(*mfDst == *mfSrc))
-} // multifabCopyPush
-
-
-void Perilla::multifabCopyPush(RegionGraph* destGraph, RegionGraph* srcGraph, amrex::MultiFab* mfDst, amrex::MultiFab* mfSrc, int f, bool singleT)
-{
-    multifabCopyPush(destGraph, srcGraph, mfDst, mfSrc, f, 1, 1, 1, 0, 0, singleT);
-}
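// Reviewer note: the non-singleT branches above all use the same idiom to
// split a connection loop across the worker team: thread ntid claims every
// iteration i with i % teamSize == ntid, bracketed by team barriers. A
// compact OpenMP illustration (the item count and printf stand in for real
// work; this is not Perilla code):
#include <omp.h>
#include <cstdio>

int main() {
    const int nItems = 16;
    #pragma omp parallel
    {
        int teamSize = omp_get_num_threads(); // role of NUM_THREADS_PER_TEAM-NUM_COMM_THREADS
        int ntid     = omp_get_thread_num();  // role of perilla::wtid()
        for (int i = 0; i < nItems; ++i)
            if (i % teamSize == ntid)         // same round-robin test as the loops above
                std::printf("worker %d handles item %d\n", ntid, i);
    } // the implicit barrier here corresponds to worker[tg]->barr->sync(...)
    return 0;
}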
-void Perilla::multifabCopyPull(RegionGraph* destGraph, RegionGraph* srcGraph, MultiFab* mfDst, MultiFab* mfSrc, int f, int dstcomp, int srccomp, int nc, int ng, int ngsrc, bool singleT)
-{
-    int myProc = ParallelDescriptor::MyProc();
-
-    int ntid = WorkerThread::perilla_wtid();
-    int tg = WorkerThread::perilla_wid();
-    //MultiFab* mfDst = destGraph->assocMF;
-    //MultiFab* mfSrc = srcGraph->assocMF;
-    if(nc<1) cout <<"MULTIFAB_COPY_C: nc must be >= 1"<< endl;
-    if(mfDst->nComp() < (dstcomp-1)) cout <<"MULTIFAB_COPY_C: nc too large for dst multifab"<< endl;
-    //if(mfSrc->nComp() < (srccomp-1)) cout <<"MULTIFAB_COPY_C: nc too large for src multifab"<< endl;
-
-    if(true)//if(!(*mfDst == *mfSrc))
-    {
-    if(ng > mfDst->nGrow()) cout <<"MULTIFAB_COPY_C: ng > 0 not supported in parallel copy"<< endl;
-    //if(ngsrc > mfSrc->nGrow()) cout <<"MULTIFAB_COPY_C: ngsrc > msrc%ng"<< endl;
-    FabCopyAssoc* cpDst = destGraph->task[f]->cpAsc_dstHead;
-    while(cpDst != 0)
-    {
-        if(cpDst->graphPartner == srcGraph)
-            break;
-        cpDst = cpDst->next;
-    }
-    if(cpDst == 0) cout <<"Metadata for across grid copy not found"<< endl;
-    //destGraph->worker[tg]->barr->sync(perilla::NUM_THREADS_PER_TEAM-1);
-
-    if(singleT)
-    {
-        omp_set_lock(&(cpDst->l_con.dLock));
-        for(int i=0; i<cpDst->l_con.ndcpy; i++)
-        {
-            Package* rcvPackage = cpDst->l_con.dcpy[i].pQueue.getFront(true); // corrected from recycleQ to pQ
-            mfDst->m_fabs_v[f]->copyFromMem(cpDst->l_con.dcpy[i].dbx,dstcomp,nc,rcvPackage->databuf);
-        }
-        for(int i=0; i<cpDst->l_con.ndcpy; i++)
-            cpDst->l_con.dcpy[i].recycleQueue.enqueue(cpDst->l_con.dcpy[i].pQueue.dequeue(true),true); // corrected from pQ to recycleQ and from recycleQ to pQ
-        cpDst->l_con.firingRuleCnt = cpDst->l_con.firingRuleCnt - cpDst->l_con.ndcpy;
-        omp_unset_lock(&(cpDst->l_con.dLock));
-    }
-    else
-    {
-        if(ntid==0)
-            omp_set_lock(&(cpDst->l_con.dLock));
-        destGraph->worker[tg]->barr->sync(perilla::NUM_THREADS_PER_TEAM-1);
-
-        for(int i=0; i<cpDst->l_con.ndcpy; i++)
-            if((i%(perilla::NUM_THREADS_PER_TEAM-1)) == ntid)
-            {
-                Package* rcvPackage = cpDst->l_con.dcpy[i].pQueue.getFront(true); // corrected from recycleQ to pQ
-                mfDst->m_fabs_v[f]->copyFromMem(cpDst->l_con.dcpy[i].dbx,dstcomp,nc,rcvPackage->databuf);
-            }
-        destGraph->worker[tg]->barr->sync(perilla::NUM_THREADS_PER_TEAM-1);
-
-        if(ntid == 0)
-        {
-            for(int i=0; i<cpDst->l_con.ndcpy; i++)
-                cpDst->l_con.dcpy[i].recycleQueue.enqueue(cpDst->l_con.dcpy[i].pQueue.dequeue(true),true); // corrected from pQ to recycleQ and from recycleQ to pQ
-            cpDst->l_con.firingRuleCnt = cpDst->l_con.firingRuleCnt - cpDst->l_con.ndcpy;
-            omp_unset_lock(&(cpDst->l_con.dLock));
-        }
-        destGraph->worker[tg]->barr->sync(perilla::NUM_THREADS_PER_TEAM-1);
-    }
-
-    int np = ParallelDescriptor::NProcs();
-    if(np == 1)
-        return;
-
-    if(singleT)
-    {
-        omp_set_lock(destGraph->rCopyMapHead->map[f]->r_con.rcvLock);
-        omp_set_lock(cpDst->r_con.rcvLock);
-        for(int i=0; i<cpDst->r_con.nrcv; i++)
-        {
-            ///*
-            Package *rcvMetaPackage = destGraph->rCopyMapHead->map[f]->r_con.rcv[i].pQueue.dequeue(true);
-            rcvMetaPackage->completed = false;
-            rcvMetaPackage->served = false;
-            rcvMetaPackage->request = MPI_REQUEST_NULL;
-            destGraph->rCopyMapHead->map[f]->r_con.rcv[i].recycleQueue.enqueue(rcvMetaPackage,true);
-
-            Package* rcvPackage = cpDst->r_con.rcv[i].pQueue.dequeue(true); // corrected from recycleQ to pQ
-            mfDst->m_fabs_v[f]->copyFromMem(cpDst->r_con.rcv[i].dbx,dstcomp,nc,rcvPackage->databuf);
-            rcvPackage->notified = false;
-            rcvPackage->completed = false;
-            cpDst->r_con.rcv[i].recycleQueue.enqueue(rcvPackage,true); // corrected from pQ to recycleQ
-            //*/
-
-            //Package* rcvPackage = cpDst->r_con.rcv[i].pQueue.getFront(true); // corrected from recycleQ to pQ
-            //mfDst->m_fabs_v[f]->copyFromMem(cpDst->r_con.rcv[i].dbx,dstcomp,nc,rcvPackage->databuf);
-        }
-        cpDst->r_con.firingRuleCnt = cpDst->r_con.firingRuleCnt - cpDst->r_con.nrcv;
-
-        cpDst->r_con.remotePullDone = true;
-        ///*
-        for(int i=0; i<cpDst->r_con.nrcv; i++)
-            if(cpDst->r_con.rcv[i].pQueue.queueSize(true) >= 1)
-                if(cpDst->r_con.rcv[i].pQueue.getFront(true)->checkRequest())
-                    cpDst->r_con.firingRuleCnt++;
-        //*/
-        omp_unset_lock(cpDst->r_con.rcvLock);
-        omp_unset_lock(destGraph->rCopyMapHead->map[f]->r_con.rcvLock);
-    }
-    else
-    {
-        if(ntid==0)
-        {
-            omp_set_lock(destGraph->rCopyMapHead->map[f]->r_con.rcvLock);
-            omp_set_lock(cpDst->r_con.rcvLock);
-        }
-        destGraph->worker[tg]->barr->sync(perilla::NUM_THREADS_PER_TEAM-1);
-
-        for(int i=0; i<cpDst->r_con.nrcv; i++)
-            if((i%(perilla::NUM_THREADS_PER_TEAM-1)) == ntid)
-            {
-                ///*
-                Package *rcvMetaPackage = destGraph->rCopyMapHead->map[f]->r_con.rcv[i].pQueue.dequeue(true);
-                rcvMetaPackage->completed = false;
-                rcvMetaPackage->served = false;
-                rcvMetaPackage->request = MPI_REQUEST_NULL;
-                destGraph->rCopyMapHead->map[f]->r_con.rcv[i].recycleQueue.enqueue(rcvMetaPackage,true);
-
-                Package* rcvPackage = cpDst->r_con.rcv[i].pQueue.dequeue(true); // corrected from recycleQ to pQ
-                mfDst->m_fabs_v[f]->copyFromMem(cpDst->r_con.rcv[i].dbx,dstcomp,nc,rcvPackage->databuf);
-                rcvPackage->notified = false;
-                rcvPackage->completed = false;
-                cpDst->r_con.rcv[i].recycleQueue.enqueue(rcvPackage,true); // corrected from pQ to recycleQ
-                //*/
-
-                //Package* rcvPackage = cpDst->r_con.rcv[i].pQueue.getFront(true); // corrected from recycleQ to pQ
-                //mfDst->m_fabs_v[f]->copyFromMem(cpDst->r_con.rcv[i].dbx,dstcomp,nc,rcvPackage->databuf);
-            }
-        destGraph->worker[tg]->barr->sync(perilla::NUM_THREADS_PER_TEAM-1);
-
-        if(ntid==0)
-        {
-            cpDst->r_con.firingRuleCnt = cpDst->r_con.firingRuleCnt - cpDst->r_con.nrcv;
-
-            cpDst->r_con.remotePullDone = true;
-            ///*
-            for(int i=0; i<cpDst->r_con.nrcv; i++)
-                if(cpDst->r_con.rcv[i].pQueue.queueSize(true) >= 1)
-                    if(cpDst->r_con.rcv[i].pQueue.getFront(true)->checkRequest())
-                        cpDst->r_con.firingRuleCnt++;
-            //*/
-            omp_unset_lock(cpDst->r_con.rcvLock);
-            omp_unset_lock(destGraph->rCopyMapHead->map[f]->r_con.rcvLock);
-        }
-        destGraph->worker[tg]->barr->sync(perilla::NUM_THREADS_PER_TEAM-1);
-    }
-    } // if(!(*mfDst == *mfSrc))
-} // multifabCopyPull
-
-void Perilla::multifabCopyPull(RegionGraph* destGraph, RegionGraph* srcGraph, MultiFab* mfDst, MultiFab* mfSrc, int f, bool singleT)
-{
-    multifabCopyPull(destGraph, srcGraph, mfDst, mfSrc, f, 1, 1, 1, 0, 0,singleT);
-}
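// Reviewer note: a hypothetical caller-side pairing of the two entry points,
// inferred from the signatures above rather than taken from an AMReX example.
// The push stages task f of mfSrc into srcGraph's connection queues; once the
// destination graph's firing rules are satisfied, the pull drains them into
// mfDst:
//
//     Perilla::multifabCopyPush(destGraph, srcGraph, &mfDst, &mfSrc, f, singleT);
//     // ... communication threads move and complete the packages ...
//     Perilla::multifabCopyPull(destGraph, srcGraph, &mfDst, &mfSrc, f, singleT);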
-void Perilla::serviceLocalGridCopyRequests(std::vector<RegionGraph*> graphArray, int g, int tg)
-{
-    int nfabs = graphArray[g]->numTasks;
-
-    for(int f=0; f<nfabs; f++)
-    {
-        int fg = f % perilla::NUM_THREAD_TEAMS;
-        if(tg == fg)
-        {
-            bool doublechecked = false;
-            FabCopyAssoc* cpSrc = graphArray[g]->task[f]->cpAsc_srcHead;
-            while(cpSrc != 0)
-            {
-                //std::cout<<" "<<f<<std::endl;
-                int lockSucceeded = omp_test_lock(&(cpSrc->l_con.sLock));
-                if(lockSucceeded != 0)
-                {
-                    for(int i=0; i<cpSrc->l_con.nscpy; i++)
-                    {
-                        if(cpSrc->l_con.scpy[i].pQueue.queueSize()>0)
-                        {
-                            assert(doublechecked==false);
-                            FabCopyAssoc* cpDst = cpSrc->graphPartner->task[cpSrc->l_con.scpy[i].nd]->cpAsc_dstHead;
-                            while(cpDst != 0)
-                            {
-                                if(cpDst->graphPartner == graphArray[g])
-                                    break;
-                                cpDst = cpDst->next;
-                            }
-                            Package* sPackage = cpSrc->l_con.scpy[i].pQueue.dequeue(true);
-                            omp_set_lock(&(cpDst->l_con.dLock));
-                            int dPartner = cpSrc->l_con.scpy[i].dPartner;
-                            Package* dPackage = cpDst->l_con.dcpy[dPartner].recycleQueue.dequeue(true);
-                            /*
-                            for(int j=0; j<dPackage->bufSize; j++)
-                            {
-                                dPackage->databuf[j] = sPackage->databuf[j];
-                            }
-                            */
-                            std::memcpy(dPackage->databuf, sPackage->databuf, dPackage->bufSize * sizeof(double));
-                            //std::swap(dPackage->databuf, sPackage->databuf);
-
-                            cpDst->l_con.dcpy[dPartner].pQueue.enqueue(dPackage,true);
-                            if(cpDst->l_con.dcpy[dPartner].pQueue.queueSize(true) == 1)
-                                cpDst->l_con.firingRuleCnt++;
-                            omp_unset_lock(&(cpDst->l_con.dLock));
-                            cpSrc->l_con.scpy[i].recycleQueue.enqueue(sPackage,true);
-                        }
-                    } // for
-                    omp_unset_lock(&(cpSrc->l_con.sLock));
-                } // if(lockSucceeded)
-                cpSrc = cpSrc->next;
-            } // while(cpSrc != 0)
-        } // if(tg==fg)
-    } // for(f<nfabs; f++)
-} // serviceLocalGridCopyRequests
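// Reviewer note: the service loop above is a lock-protected handoff between
// two graphs on the same rank: dequeue a filled package from the source
// connection, dequeue a free package from the destination's recycle pool,
// copy bufSize doubles, enqueue on the destination's pending queue, and bump
// firingRuleCnt when that queue becomes non-empty. A simplified single-pair
// sketch with std::mutex standing in for the omp_lock_t pair (toy types, not
// the Perilla classes):
#include <mutex>
#include <queue>
#include <vector>

struct Pkg { std::vector<double> databuf; };

struct Side {
    std::mutex lock;
    std::queue<Pkg*> pQueue, recycleQueue;
    int firingRuleCnt = 0;
};

void serviceOneLocalCopy(Side& src, Side& dst) {
    std::scoped_lock guard(src.lock, dst.lock); // deadlock-free two-lock acquire
    if (src.pQueue.empty() || dst.recycleQueue.empty()) return;
    Pkg* s = src.pQueue.front();       src.pQueue.pop();
    Pkg* d = dst.recycleQueue.front(); dst.recycleQueue.pop();
    d->databuf = s->databuf;           // the real code memcpy's bufSize doubles
    dst.pQueue.push(d);
    if (dst.pQueue.size() == 1) ++dst.firingRuleCnt; // queue just became non-empty
    src.recycleQueue.push(s);          // return the drained source buffer
}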
-void Perilla::serviceRemoteGridCopyRequests(std::vector<RegionGraph*> graphArray, int g, int nGraphs, int tg)
-{
-    bool nextsReq, nextrReq;
-    int np = ParallelDescriptor::NProcs();
-    int myProc = ParallelDescriptor::MyProc();
-    int numfabs = graphArray[g]->numTasks;
-    //MultiFab* mf = graphArray[g]->assocMF;
-    int graphID = graphArray[g]->graphID;
-
-    for(int f=0; f<numfabs; f++)
-    {
-        FabCopyAssoc* cpDst = graphArray[g]->task[f]->cpAsc_dstHead;
-        while(cpDst != 0)
-        {
-            if(omp_test_lock(graphArray[g]->rCopyMapHead->map[f]->r_con.rcvLock) != 0)
-            {
-                if(omp_test_lock(cpDst->r_con.rcvLock) != 0)
-                {
-                    for(int i=0; i<cpDst->r_con.nrcv; i++)
-                    {
-                        if(graphArray[g]->rCopyMapHead->map[f]->r_con.rcv[i].pQueue.queueSize(true) == 0) //!no message has been received or all received messages have been claimed
-                        {
-                            nextsReq = true;
-                        }
-                        else
-                        {
-                            Package *rearPackage = graphArray[g]->rCopyMapHead->map[f]->r_con.rcv[i].pQueue.getRear(true);//!CHECK THIS POINT LATER
-                            // Also check the recycle queue because when rear is completed it may cause unlimited recv posts
-                            if(rearPackage->completed && graphArray[g]->rCopyMapHead->map[f]->r_con.rcv[i].recycleQueue.queueSize() > 1) //!latest receive request has been completed
-                            {
-                                nextsReq = true;
-                            }
-                            else //!expected message is still on the way
-                                nextsReq = false;
-                        }
-                        if(nextsReq) //!take a message from recycle pool and post a receive
-                        {
-                            //!create a package to keep track of receive requests
-                            Package *rMetaPackage = graphArray[g]->rCopyMapHead->map[f]->r_con.rcv[i].recycleQueue.dequeue(true);
-                            //!extract a package from the recycle pool at the destination NUMA node to buffer incoming data
-                            int ns = graphArray[g]->rCopyMapHead->map[f]->r_con.rcv[i].ns;
-                            int nd = graphArray[g]->rCopyMapHead->map[f]->r_con.rcv[i].nd;
-                            int lnd = graphArray[g]->rCopyMapHead->map[f]->r_con.rcv[i].lnd;
-                            int r_grids = graphArray[g]->rCopyMapHead->map[f]->r_con.rcv[i].r_grids;
-                            Package *rPackage = cpDst->r_con.rcv[i].recycleQueue.dequeue(true);
-                            //int tag = tagGen(ns, nd, graphID-1, np*r_grids, nGraphs);
-                            //int tag = Perilla::myTagMap[graphID-1][nd][ns];
-                            //int tag = graphArray[g]->rCopyMapHead->map[f]->r_con.rcv[i].lnd;
-                            int tag = tagMap[graphArray[g]->rCopyMapHead->map[f]->r_con.rcv[i].pr][g][nd][ns][graphArray[g]->rCopyMapHead->map[f]->r_con.rcv[i].sz];
-
-                            // if(graphArray[g]->graphID == 25 && lnd==10 && myProc==54)
-                            //std::cout << "R Posted g " << g << " myP " << myProc << " lnd " << lnd <<" nd "<< nd << " ns "<< ns << " pr " << graphArray[g]->rCopyMapHead->map[f]->r_con.rcv[i].pr << std::endl;
-
-                            rMetaPackage->request = MPI_REQUEST_NULL;
-                            cpDst->r_con.rcv[i].pQueue.enqueue(rPackage,true); //!this is not done yet
-                            graphArray[g]->rCopyMapHead->map[f]->r_con.rcv[i].pQueue.enqueue(rMetaPackage,true); //!this is not done yet
-                            rMetaPackage->request = ParallelDescriptor::Arecv(rPackage->databuf,
-                                graphArray[g]->rCopyMapHead->map[f]->r_con.rcv[i].sz,
-                                graphArray[g]->rCopyMapHead->map[f]->r_con.rcv[i].pr, tag).req(); // tag == SeqNum in c++ ver
-                        }
-                    } // for (i<cpDst->r_con.nrcv)
-                    omp_unset_lock(cpDst->r_con.rcvLock);
-                } // if(ga locked)
-                omp_unset_lock(graphArray[g]->rCopyMapHead->map[f]->r_con.rcvLock);
-            } // if(mf locked)
-            cpDst = cpDst->next;
-        } // while(cpDst != 0)
-    } // for(f<numfabs; f++)
-
-    for(int f=0; f<numfabs; f++)
-    {
-        FabCopyAssoc* cpSrc = graphArray[g]->task[f]->cpAsc_srcHead;
-        while(cpSrc != 0)
-        {
-            for(int i=0; i<cpSrc->r_con.nsnd; i++)
-            {
-                //if(g == 17 && f == 316 && i == 164)
-                //std::cout << "Comm Thread nsnd "<< cpSrc->r_con.nsnd << " " << graphArray[g]<< std::endl;
-                if(graphArray[g]->sCopyMapHead->map[f]->r_con.snd[i].pQueue.queueSize(true) == 0) //!no message has been received or all received messages have been claimed
-                    nextrReq = false;
-                else
-                    nextrReq = true;
-
-                if(nextrReq) //!take a message from recycle pool and post a receive
-                {
-                    Package *sMetaPackage = graphArray[g]->sCopyMapHead->map[f]->r_con.snd[i].pQueue.getFront(true);
-                    if(!sMetaPackage->served)
-                    {
-                        Package *sPackage = cpSrc->r_con.snd[i].pQueue.getFront(true);
-                        sMetaPackage->completed = false;
-                        sMetaPackage->served = true;
-                        sMetaPackage->request = MPI_REQUEST_NULL;
-                        int ns = graphArray[g]->sCopyMapHead->map[f]->r_con.snd[i].ns;
-                        int nd = graphArray[g]->sCopyMapHead->map[f]->r_con.snd[i].nd;
-                        int r_gid = graphArray[g]->sCopyMapHead->map[f]->r_con.snd[i].r_gid;
-                        int r_grids = graphArray[g]->sCopyMapHead->map[f]->r_con.snd[i].r_grids;
-                        //int tag = tagGen(ns, nd, r_gid-1, np*r_grids, nGraphs);
-                        int tag = Perilla::myTagMap[r_gid][nd][ns][graphArray[g]->sCopyMapHead->map[f]->r_con.snd[i].sz];
-                        sMetaPackage->request = ParallelDescriptor::Asend(sPackage->databuf,
-                            graphArray[g]->sCopyMapHead->map[f]->r_con.snd[i].sz,
-                            graphArray[g]->sCopyMapHead->map[f]->r_con.snd[i].pr, tag).req(); // tag == SeqNum in c++ ver
-                        //if(g == 31 && nd == 519 )
-                        //std::cout << "S Posted r_g " << r_gid << " atP " << myProc << " nd "<< nd << " ns "<< ns << " pr " << graphArray[g]->sCopyMapHead->map[f]->r_con.snd[i].pr << std::endl;
-                    }
-                }
-            } // for (i<cpSrc->r_con.nsnd)
-            cpSrc = cpSrc->next;
-        } // while(cpSrc != 0)
-    } // for(f<numfabs; f++)
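// Reviewer note: the two loops above post nonblocking transfers
// (ParallelDescriptor::Arecv/Asend store the MPI_Request in a metadata
// package); the two loops that follow poll those requests with
// ParallelDescriptor::Test and recycle completed packages. The underlying
// MPI pattern being wrapped looks roughly like this (buffer, rank, and tag
// are placeholders):
#include <mpi.h>

void postAndPoll(double* buf, int count, int srcRank, int tag) {
    MPI_Request req;
    MPI_Irecv(buf, count, MPI_DOUBLE, srcRank, tag, MPI_COMM_WORLD, &req);

    int done = 0;
    MPI_Status status;
    while (!done) {
        // a comm thread would service other queues between polls;
        // here we simply spin until the message lands
        MPI_Test(&req, &done, &status);
    }
}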
-    for(int f=0; f<numfabs; f++)
-    {
-        FabCopyAssoc* cpDst = graphArray[g]->task[f]->cpAsc_dstHead;
-        while(cpDst != 0)
-        {
-            for(int i=0; i<cpDst->r_con.nrcv; i++)
-            {
-                if(graphArray[g]->rCopyMapHead->map[f]->r_con.rcv[i].pQueue.queueSize(true) > 0) //!all messages before rear have completed
-                {
-                    if(omp_test_lock(cpDst->r_con.rcvLock) != 0)
-                    {
-                        Package *rearPackage = graphArray[g]->rCopyMapHead->map[f]->r_con.rcv[i].pQueue.getRear(true);
-                        if(!rearPackage->completed)
-                        {
-                            bool flag = false;
-                            int ret_flag=0;
-                            MPI_Status status;
-                            ParallelDescriptor::Test(rearPackage->request, ret_flag, status);
-
-                            flag = (ret_flag == 0) ? false : true;//parallel_test_one(rearPackage%ptr%request) -------???????
-                            if(flag)
-                            {
-                                rearPackage->completeRequest();
-                                cpDst->r_con.rcv[i].pQueue.getRear()->completeRequest();
-
-                                if(graphArray[g]->rCopyMapHead->map[f]->r_con.rcv[i].pQueue.queueSize(true) == 1)
-                                {
-                                    //if(graphArray[g]->graphID == 25 && f==0 && myProc==1)
-                                    //std::cout<<"Recieved fc++ for f " << f << " fc " << cpDst->r_con.firingRuleCnt << std::endl;
-                                    cpDst->r_con.firingRuleCnt++;
-                                }
-#pragma omp flush
-                            }
-                        }
-                        omp_unset_lock(cpDst->r_con.rcvLock);
-                    } // if(ga locked)
-                } // if(pQueue.queueSize(true) > 0)
-            } // for (i<cpDst->r_con.nrcv)
-            cpDst = cpDst->next;
-        } // while(cpDst != 0)
-    } // for(f<numfabs; f++)
-
-    for(int f=0; f<numfabs; f++)
-    {
-        FabCopyAssoc* cpSrc = graphArray[g]->task[f]->cpAsc_srcHead;
-        while(cpSrc != 0)
-        {
-            for(int i=0; i<cpSrc->r_con.nsnd; i++)
-            {
-                if(graphArray[g]->sCopyMapHead->map[f]->r_con.snd[i].pQueue.queueSize(true) > 0)
-                {
-                    Package *frontPackage = graphArray[g]->sCopyMapHead->map[f]->r_con.snd[i].pQueue.getFront(true);
-                    if(frontPackage->served && !frontPackage->completed) //!latest receive request has NOT been completed
-                    {
-                        bool flag = false;
-                        int ret_flag;
-                        MPI_Status status;
-                        ParallelDescriptor::Test(frontPackage->request, ret_flag, status);
-                        flag = (ret_flag == 0) ? false : true;//parallel_test_one(frontPackage%ptr%request) -------???????
-                        if(flag)
-                        {
-                            omp_set_lock(graphArray[g]->sCopyMapHead->map[f]->r_con.sndLock);
-                            frontPackage = graphArray[g]->sCopyMapHead->map[f]->r_con.snd[i].pQueue.dequeue(true);
-                            frontPackage->completed = false;
-                            frontPackage->served = false;
-                            frontPackage->request = MPI_REQUEST_NULL;
-                            frontPackage->notified = false;
-                            graphArray[g]->sCopyMapHead->map[f]->r_con.snd[i].recycleQueue.enqueue(frontPackage,true);
-                            omp_unset_lock(graphArray[g]->sCopyMapHead->map[f]->r_con.sndLock);
-#pragma omp flush
-                            omp_set_lock(cpSrc->r_con.sndLock);
-                            frontPackage = cpSrc->r_con.snd[i].pQueue.dequeue(true);
-                            frontPackage->completed = false;
-                            frontPackage->served = false;
-                            frontPackage->request = MPI_REQUEST_NULL;
-                            cpSrc->r_con.snd[i].recycleQueue.enqueue(frontPackage,true);
-                            omp_unset_lock(cpSrc->r_con.sndLock);
-                        }
-                    }
-                } // if(queueSize > 0)
-            } // for (i<cpSrc->r_con.nsnd)
-            cpSrc = cpSrc->next;
-        } // while(cpSrc != 0)
-    } // for(f<numfabs; f++)
-} // serviceRemoteGridCopyRequests
-
-void Perilla::resetRemoteGridCopyRequests(std::vector<RegionGraph*> graphArray, int g, int nGraphs, int tg)
-{
-    int np = ParallelDescriptor::NProcs();
-    int myProc = ParallelDescriptor::MyProc();
-    int numfabs = graphArray[g]->numTasks;
-    //MultiFab* mf = graphArray[g]->assocMF;
-    int graphID = graphArray[g]->graphID;
-
-    for(int f=0; f<numfabs; f++)
-    {
-        if(WorkerThread::isMyRegion(tg,f))
-        {
-            FabCopyAssoc* cpSrc = graphArray[g]->task[f]->cpAsc_srcHead;
-            while(cpSrc != 0)
-            {
-                if(cpSrc->r_con.remotePushReady)
-                {
-                    omp_set_lock(graphArray[g]->sCopyMapHead->map[f]->r_con.sndLock);
-                    for(int i=0; i<cpSrc->r_con.nsnd; i++)
-                    {
-                        graphArray[g]->sCopyMapHead->map[f]->r_con.snd[i].pQueue.enqueue(graphArray[g]->sCopyMapHead->map[f]->r_con.snd[i].recycleQueue.dequeue(true),true);
-                    }
-                    omp_unset_lock(graphArray[g]->sCopyMapHead->map[f]->r_con.sndLock);
-                    cpSrc->r_con.remotePushReady = false;
-                }// if remotepushready
-                cpSrc = cpSrc->next;
-            }
-        }// ismyRegion
-    }//for f
-
-    for(int f=0; f<numfabs; f++)
-    {
-        if(WorkerThread::isMyRegion(tg,f))
-        {
-            FabCopyAssoc* cpDst = graphArray[g]->task[f]->cpAsc_dstHead;
-            while(cpDst != 0)
-            {
if(omp_test_lock(graphArray[g]->rCopyMapHead->map[f]->r_con.rcvLock) != 0) - { - if(omp_test_lock(cpDst->r_con.rcvLock) != 0) - { - //if(f==1 && g==26 && myProc == 54) - //std::cout<<"Completing Push f " << f << " gID " << g+1 << " myP " << myProc << " PDone "<< cpDst->r_con.remotePullDone <r_con.remotePullDone) - { - for(int i=0; ir_con.nrcv; i++) - { - - Package *rcvMetaPackage = graphArray[g]->rCopyMapHead->map[f]->r_con.rcv[i].pQueue.dequeue(true); - rcvMetaPackage->completed = false; - rcvMetaPackage->served = false; - rcvMetaPackage->request = MPI_REQUEST_NULL; - graphArray[g]->rCopyMapHead->map[f]->r_con.rcv[i].recycleQueue.enqueue(rcvMetaPackage,true); - - Package* rcvPackage = cpDst->r_con.rcv[i].pQueue.dequeue(true); // corrected from recycleQ to pQ - rcvPackage->notified = false; - rcvPackage->completed = false; - cpDst->r_con.rcv[i].recycleQueue.enqueue(rcvPackage,true); // corrected from pQ to recycleQ - - //cpDst->r_con.firingRuleCnt = cpDst->r_con.firingRuleCnt - 1; - - if(cpDst->r_con.rcv[i].pQueue.queueSize(true) >= 1) - if(cpDst->r_con.rcv[i].pQueue.getFront(true)->checkRequest()) - cpDst->r_con.firingRuleCnt++; - - - } // for (ir_con.nrcv) - - cpDst->r_con.remotePullDone = false; - - //if(f==1 && g==26 && myProc == 54) - // std::cout<<"Completed Push f " << f << " gID " << g+1 << " myP " << myProc << " PDone "<< cpDst->r_con.remotePullDone <r_con.rcvLock); - } // if(ga locked) - omp_unset_lock(graphArray[g]->rCopyMapHead->map[f]->r_con.rcvLock); - } // if(mf locked) - cpDst = cpDst->next; - } // while(cpDst != 0) - /* - if(false) - for(int id=0; idtask[f]->depTaskIDs.size(); id++) - { - int df = graphArray[g]->task[f]->depTaskIDs[id]; - if(WorkerThread::isMyRegion(0,df)) - { - int lgID = graphArray[g]->srcLinkGraph->graphID-1; - - //if(f==1 && g==26 && myProc == 54) - //std::cout<<"Completing Dep Push f " << df << " gID " << lgID+1 << " myP " << myProc <task[df]->cpAsc_dstHead; - while(cpdDst != 0) - { - if(omp_test_lock(graphArray[lgID]->rCopyMapHead->map[df]->r_con.rcvLock) != 0) - { - if(omp_test_lock(cpdDst->r_con.rcvLock) != 0) - { - //if(f==1 && g==26 && myProc == 54) - //std::cout<<"Completing Push f " << f << " gID " << g+1 << " myP " << myProc << " PDone "<< cpdDst->r_con.remotePullDone <r_con.remotePullDone) - { - for(int i=0; ir_con.nrcv; i++) - { - - Package *rcvMetaPackage = graphArray[lgID]->rCopyMapHead->map[df]->r_con.rcv[i].pQueue.dequeue(true); - rcvMetaPackage->completed = false; - rcvMetaPackage->served = false; - rcvMetaPackage->request = MPI_REQUEST_NULL; - graphArray[lgID]->rCopyMapHead->map[df]->r_con.rcv[i].recycleQueue.enqueue(rcvMetaPackage,true); - - Package* rcvPackage = cpdDst->r_con.rcv[i].pQueue.dequeue(true); // corrected from recycleQ to pQ - rcvPackage->notified = false; - rcvPackage->completed = false; - cpdDst->r_con.rcv[i].recycleQueue.enqueue(rcvPackage,true); // corrected from pQ to recycleQ - - //cpdDst->r_con.firingRuleCnt = cpdDst->r_con.firingRuleCnt - 1; - - if(cpdDst->r_con.rcv[i].pQueue.queueSize(true) >= 1) - if(cpdDst->r_con.rcv[i].pQueue.getFront(true)->checkRequest()) - cpdDst->r_con.firingRuleCnt++; - - - } // for (ir_con.nrcv) - - cpdDst->r_con.remotePullDone = false; - - //if(df==10 && lgID==24 && myProc == 54) - // std::cout<<"Completed Push f " << df << " gID " << lgID+1 << " myP " << myProc << " PDone "<< cpdDst->r_con.remotePullDone <r_con.rcvLock); - } // if(ga locked) - omp_unset_lock(graphArray[lgID]->rCopyMapHead->map[df]->r_con.rcvLock); - } // if(mf locked) - cpdDst = cpdDst->next; - } // while(cpdDst != 0) 
- - - } // if tg==0 region - - - } // for all dependents - */ - - - - } - } // for(f -#include - - -namespace perilla{ - -struct _workerThreadInfo{ - int _tid; //thread id in local group - int _size; //number of threads in the group -}; - -struct _threadInfo{ - bool _isComm; //whether this thread handles communication - int _wtid; //worker thread id (-1 if this thread is decicated to communication) - int _nWts; //number of thread groups -}; - -class RTS -{ - private: - int _nWrks; - void RTS_Init(); - int _rank, _nProcs; - - public: - RTS(){ - _nWrks=1; - char* nWrks= getenv("NWORKERS"); - if(nWrks) _nWrks= atoi(nWrks); - } - RTS(int nWrks):_nWrks(nWrks){} - int ProcCount(); - int MyProc(); - int WorkerThreadCount(); - int MyWorkerThread(); - void Init(); //Build the runtime system from scratch - void Init(int rank, int nProcs);//Build the runtime system on pre-existing MPI processes - void Iterate(void *graph, int max_step, Real stop_time); - void Finalize(); -// double Time(); - void Barrier(); - void runAMR(Amr* amrptr, int max_step, Real stop_time); -}; - -} - -#endif diff --git a/Src/AmrTask/rts_impls/mpi_omp/PerillaRts.cpp b/Src/AmrTask/rts_impls/mpi_omp/PerillaRts.cpp deleted file mode 100644 index 62048ad4210..00000000000 --- a/Src/AmrTask/rts_impls/mpi_omp/PerillaRts.cpp +++ /dev/null @@ -1,111 +0,0 @@ -//Question? email tannguyen@lbl.gov -//Created 07-19-2017 -//ompodification 08-14-2017 -#include -#include -#include -#include -#include -#include "PerillaRts.H" - -using namespace perilla; -#ifdef PERILLA_DEBUG -#include -PerillaMemCheck memcheck; -#endif - -#include -#include -using namespace std; -#include - -namespace perilla{ - Amr* amrptr; - - int RTS::ProcCount(){ - return _nProcs; - } - - int RTS::MyProc(){ - return _rank; - } - - int RTS::WorkerThreadCount(){ - return _nWrks; - } - - int RTS::MyWorkerThread(){ - return 0; - } - - void RTS::runAMR(Amr* amr, int max_step, Real stop_time){ - while ( amr->okToContinue() && - (amr->levelSteps(0) < max_step || max_step < 0) && - (amr->cumTime() < stop_time || stop_time < 0.0) ) - - { - // Do a coarse timestep, which calls one or multiple timestep updates (i.e. 
timeStep()) at each AMR level - amr->coarseTimeStep(stop_time); - } - } - - void InitializeMPI(){ - int provided; - MPI_Init_thread(0, 0, MPI_THREAD_FUNNELED, &provided); - if(provided == MPI_THREAD_SINGLE){//with this MPI, process can't spawn threads - cerr << "Spawning threads is not allowed by the MPI implementation" << std::endl;; - } - } - - void RTS::RTS_Init(){ - amrptr= NULL; - } - - void RTS::Init(){ - InitializeMPI(); - MPI_Comm_rank(MPI_COMM_WORLD, &_rank); - MPI_Comm_size(MPI_COMM_WORLD, &_nProcs); - RTS_Init(); - } - - void RTS::Init(int rank, int nProcs){ - _rank= rank; - _nProcs= nProcs; - RTS_Init(); - } - - void RTS::Finalize(){ -#ifdef PERILLA_DEBUG - memcheck.report(); -#endif - } - - void RTS::Iterate(void* amrGraph, int max_step, Real stop_time){ - Perilla::max_step=max_step; - assert(amrGraph); - amrptr= (Amr*)amrGraph; - runAMR(amrptr, max_step, stop_time); - } - -#if 0 - const double kMicro = 1.0e-6; - double RTS::Time() - { - struct timeval TV; - - const int RC = gettimeofday(&TV, NULL); - if(RC == -1) - { - printf("ERROR: Bad call to gettimeofday\n"); - return(-1); - } - return( ((double)TV.tv_sec) + kMicro * ((double)TV.tv_usec) ); - } -#endif - - void RTS::Barrier(){ - //nothing - } - -}//end namespace - diff --git a/Src/AmrTask/rts_impls/mpi_omp/RGIter.H b/Src/AmrTask/rts_impls/mpi_omp/RGIter.H deleted file mode 100755 index 8141fdc1300..00000000000 --- a/Src/AmrTask/rts_impls/mpi_omp/RGIter.H +++ /dev/null @@ -1,65 +0,0 @@ -#ifndef RGITER_H_ -#define RGITER_H_ - -#include -//#include -//#include -#include - -namespace amrex{ - - class AsyncFillPatchIterator; - - class RGIter - { - public: - int tid; - int ntid; - int tg; - int currentRegion; - int currentTile; - int totalItr; - int currentItr; - bool tiling; - bool implicit; - bool ppteams; - bool haveDepGraph; - RegionGraph* itrGraph; - RegionGraph* depGraph; - int boxGrow, index, scomp, ncomp, iteration; - double time; - double getFireableTime; - amrex::MultiFab *_dest; - - IndexType typ; - - Vector m_level_afpi; - Vector m_upper_level_afpi; - std::ofstream fout; - - public: - RGIter(RegionGraph* rg, bool enableAllTasks=false); - RGIter(RegionGraph* rg, RegionGraph* drg, bool isDep=true); - RGIter(amrex::AsyncFillPatchIterator* afpi, bool enableAllTasks=false); - RGIter(Vector afpi, Vector upper_afpi, - amrex::MultiFab& dest, int bG, double tm, int ind, int sc, int nc, int itr); - ~RGIter(); - - void init(); - void sync_workers(); - //! Increment iterator to the next tile we own. - void operator++ (); - //! Is the iterator valid, are more regions to iterate over? - bool isValid(); - int LocalIndex() const { return currentRegion; } - void exec(); - - amrex::Box tileBox(); - amrex::Box validBox() const; - amrex::Box tilebox(); - amrex::Box growntilebox(); - amrex::Box growntilebox(int ng); - amrex::Box nodaltilebox(int dir); - }; -} -#endif diff --git a/Src/AmrTask/rts_impls/mpi_omp/RGIter.cpp b/Src/AmrTask/rts_impls/mpi_omp/RGIter.cpp deleted file mode 100755 index 74ffe274bb6..00000000000 --- a/Src/AmrTask/rts_impls/mpi_omp/RGIter.cpp +++ /dev/null @@ -1,615 +0,0 @@ -#include -#include -#include -#include -#include - -#include -#include -using namespace perilla; -#include -#include "RGIter.H" - -namespace amrex{ - - RGIter::RGIter(RegionGraph* rg, bool enableAllTasks): - itrGraph(rg), - implicit(false), - ppteams(true), - //typ(rg->typ), - haveDepGraph(false), - depGraph(NULL), - getFireableTime(0.) 
- { - tid = perilla::tid(); - tg = perilla::wid(); - ntid = perilla::wtid(); - - itrGraph->worker[tg]->barr->sync(perilla::NUM_THREADS_PER_TEAM-perilla::NUM_COMM_THREADS); - if(perilla::isMasterWorkerThread()) - itrGraph->Reset(); - itrGraph->worker[tg]->barr->sync(perilla::NUM_THREADS_PER_TEAM-perilla::NUM_COMM_THREADS); - if(enableAllTasks) - itrGraph->enableAllRegions(); - itrGraph->worker[tg]->barr->sync(perilla::NUM_THREADS_PER_TEAM-perilla::NUM_COMM_THREADS); - init(); - } - - RGIter::RGIter(RegionGraph* rg, RegionGraph* drg, bool isDep): - itrGraph(rg), - implicit(false), - ppteams(true), - //typ(rg->typ), - haveDepGraph(isDep), - depGraph(drg), - getFireableTime(0.) - { - tid = perilla::tid(); - tg = perilla::wid(); - ntid = perilla::wtid(); - itrGraph->worker[tg]->barr->sync(perilla::NUM_THREADS_PER_TEAM-perilla::NUM_COMM_THREADS); - if(perilla::isMasterWorkerThread()) itrGraph->Reset(); - itrGraph->worker[tg]->barr->sync(perilla::NUM_THREADS_PER_TEAM-perilla::NUM_COMM_THREADS); - init(); - } - - RGIter::RGIter(amrex::AsyncFillPatchIterator* afpi, bool enableAllTasks): - itrGraph(afpi->destGraph), - implicit(false), - ppteams(true), - //typ(afpi->destGraph->typ), - haveDepGraph(false), - depGraph(NULL), - getFireableTime(0.) - { - tid = perilla::tid(); - tg = perilla::wid(); - ntid = perilla::wtid(); - itrGraph->worker[tg]->barr->sync(perilla::NUM_THREADS_PER_TEAM-perilla::NUM_COMM_THREADS); - if(perilla::isMasterWorkerThread()) - afpi->Reset(); - itrGraph->worker[tg]->barr->sync(perilla::NUM_THREADS_PER_TEAM-perilla::NUM_COMM_THREADS); - if(enableAllTasks) - itrGraph->enableAllRegions(); - itrGraph->worker[tg]->barr->sync(perilla::NUM_THREADS_PER_TEAM-perilla::NUM_COMM_THREADS); - - init(); - } - -#ifndef USE_PERILLA_ON_DEMAND - RGIter::RGIter(Vector afpi, Vector upper_afpi, - amrex::MultiFab& dest, int bG, double tm, int ind, int sc, int nc, int itr): - itrGraph(afpi[itr-1]->destGraph), - m_level_afpi(afpi), - m_upper_level_afpi(upper_afpi), - boxGrow(bG), - time(tm), - index(ind), - scomp(sc), - ncomp(nc), - iteration(itr), - implicit(true), - ppteams(true), - //typ(afpi[itr-1]->destGraph->typ), - haveDepGraph(false), - depGraph(NULL), - getFireableTime(0.) 
- { - int myProc = amrex::ParallelDescriptor::MyProc(); - bool push = true; - - tid = perilla::tid(); - tg = perilla::wid(); - ntid = perilla::wtid(); - - itrGraph->worker[tg]->barr->sync(perilla::NUM_THREADS_PER_TEAM-perilla::NUM_COMM_THREADS); - if(perilla::isMasterWorkerThread()) - m_level_afpi[iteration-1]->Reset(); - itrGraph->worker[tg]->barr->sync(perilla::NUM_THREADS_PER_TEAM-perilla::NUM_COMM_THREADS); - - if(ntid == perilla::NUM_THREADS_PER_TEAM-2) - { - int f; - int level = m_level_afpi[iteration-1]->m_amrlevel.level; - double dt = m_level_afpi[iteration-1]->m_amrlevel.parent->dtLevel(level); - this->currentItr = 1; - this->totalItr = 1; - - //////////////////////////////////////Push Pull Thread Start///////////////////////// - while(m_level_afpi[iteration-1]->destGraph->worker[tg]->completedRegionQueue->queueSize(true) != m_level_afpi[iteration-1]->destGraph->worker[tg]->totalTasks || - m_level_afpi[iteration-1]->destGraph->worker[tg]->computedTasks != m_level_afpi[iteration-1]->destGraph->worker[tg]->totalTasks) - { - f = m_level_afpi[iteration-1]->destGraph->getFireableRegion(tg); - if(f != -1) - { - m_level_afpi[iteration-1]->Receive(this,dest,boxGrow,time,index,scomp,ncomp,f,true); - m_level_afpi[iteration-1]->destGraph->setFireableRegion(f); - if(m_level_afpi[iteration-1]->destGraph->worker[tg]->unfireableRegionQueue->queueSize(true) !=0 && - m_level_afpi[iteration-1]->destGraph->worker[tg]->fireableRegionQueue->queueSize(true) < 2) - continue; - } - - if(m_level_afpi[iteration-1]->destGraph->worker[tg]->computedRegionQueue->queueSize() != 0) - { - f = m_level_afpi[iteration-1]->destGraph->worker[tg]->computedRegionQueue->removeRegion(); - - if(push & level == m_level_afpi[iteration-1]->m_amrlevel.parent->finestLevel() && iteration < m_level_afpi[iteration-1]->m_amrlevel.parent->nCycle(level)) - m_level_afpi[iteration]->SendIntraLevel(*(this),boxGrow,time+dt,index,scomp,ncomp,iteration,f,true); - - if(push & level < m_level_afpi[iteration-1]->m_amrlevel.parent->finestLevel()) - { - for(int i=0; i < m_level_afpi[iteration-1]->m_amrlevel.parent->nCycle(level+1); i++) - { - m_upper_level_afpi[i]->SendInterLevel(this,boxGrow,time+(i*m_level_afpi[iteration-1]->m_amrlevel.parent->dtLevel(level+1)),index,scomp,ncomp,i+1,f,true); - } - } - m_level_afpi[iteration-1]->destGraph->worker[tg]->completedRegionQueue->addRegion(f,true); - } - } - //fout.close(); - ////////////////////////////////////////////////////////Push Pull Thread End//////////////////// - } - else - { - //fout << "Calling init "<< std::endl; - //fout.close(); - init(); - } - } - -#else - - RGIter::RGIter(Vector afpi, Vector upper_afpi, - amrex::MultiFab& dest, int bG, double tm, int ind, int sc, int nc, int itr): - itrGraph(afpi[itr-1]->destGraph), - m_level_afpi(afpi), - m_upper_level_afpi(upper_afpi), - _dest(&dest), - boxGrow(bG), - time(tm), - index(ind), - scomp(sc), - ncomp(nc), - iteration(itr), - implicit(true), - ppteams(true), - haveDepGraph(false), - depGraph(NULL), - getFireableTime(0.) 
- { - int myProc = amrex::ParallelDescriptor::MyProc(); - bool push = true; - - int tid = perilla::tid(); - int tg = perilla::wid(); - int ntid = perilla::wtid(); - - if(perilla::isCommunicationThread()) - { - std::vector flattenedGraphArray; - Perilla::flattenGraphHierarchy(m_level_afpi[iteration-1]->m_amrlevel.parent->graphArray, flattenedGraphArray); - while(true){ - Perilla::serviceMultipleGraphCommDynamic(flattenedGraphArray,true,perilla::tid()); - if( Perilla::numTeamsFinished == perilla::NUM_THREAD_TEAMS) - { - break; - } - } - }else -{ - - AsyncFillPatchIterator::initialSend(m_level_afpi, m_upper_level_afpi, boxGrow, time, index, scomp, ncomp, iteration); - syncAllWorkerThreads(); - - itrGraph->worker[tg]->barr->sync(perilla::NUM_THREADS_PER_TEAM-perilla::NUM_COMM_THREADS); - if(perilla::isMasterWorkerThread()) - m_level_afpi[iteration-1]->Reset(); - itrGraph->worker[tg]->barr->sync(perilla::NUM_THREADS_PER_TEAM-perilla::NUM_COMM_THREADS); - - if(ntid == perilla::NUM_THREADS_PER_TEAM-2) - { - int f; - int level = m_level_afpi[iteration-1]->m_amrlevel.level; - double dt = m_level_afpi[iteration-1]->m_amrlevel.parent->dtLevel(level); - this->currentItr = 1; - this->totalItr = 1; - while(m_level_afpi[iteration-1]->destGraph->worker[tg]->completedRegionQueue->queueSize(true) != m_level_afpi[iteration-1]->destGraph->worker[tg]->totalTasks || - m_level_afpi[iteration-1]->destGraph->worker[tg]->computedTasks != m_level_afpi[iteration-1]->destGraph->worker[tg]->totalTasks) - { - f = m_level_afpi[iteration-1]->destGraph->getFireableRegion(tg); - if(f != -1) - { - m_level_afpi[iteration-1]->Receive(this,*_dest,boxGrow,time,index,scomp,ncomp,f,true); - m_level_afpi[iteration-1]->destGraph->setFireableRegion(f); - if(m_level_afpi[iteration-1]->destGraph->worker[tg]->unfireableRegionQueue->queueSize(true) !=0 && - m_level_afpi[iteration-1]->destGraph->worker[tg]->fireableRegionQueue->queueSize(true) < 2) - continue; - } - - if(m_level_afpi[iteration-1]->destGraph->worker[tg]->computedRegionQueue->queueSize() != 0) - { - f = m_level_afpi[iteration-1]->destGraph->worker[tg]->computedRegionQueue->removeRegion(); - - if(push & level == m_level_afpi[iteration-1]->m_amrlevel.parent->finestLevel() && iteration < m_level_afpi[iteration-1]->m_amrlevel.parent->nCycle(level)) - m_level_afpi[iteration]->SendIntraLevel(*(this),boxGrow,time+dt,index,scomp,ncomp,iteration,f,true); - - if(push & level < m_level_afpi[iteration-1]->m_amrlevel.parent->finestLevel()) - { - for(int i=0; i < m_level_afpi[iteration-1]->m_amrlevel.parent->nCycle(level+1); i++) - { - m_upper_level_afpi[i]->SendInterLevel(this,boxGrow,time+(i*m_level_afpi[iteration-1]->m_amrlevel.parent->dtLevel(level+1)),index,scomp,ncomp,i+1,f,true); - } - } - m_level_afpi[iteration-1]->destGraph->worker[tg]->completedRegionQueue->addRegion(f,true); - } - } - } - else - { - //fout << "Calling init "<< std::endl; - //fout.close(); - init(); - } -} - - } - -#endif - using namespace perilla; - - RGIter::~RGIter() - { - //fout.close(); - } - - void RGIter::init() - { - if(itrGraph->fabTiles.size() == 0) - tiling = false; - else - tiling = true; - - int myProc = amrex::ParallelDescriptor::MyProc(); - if(implicit) - { - if(!itrGraph->isGraphEmptyV2()) - { - currentRegion = itrGraph->getPulledFireableRegion(); - if(tiling) - totalItr = std::ceil( (1.0*itrGraph->fabTiles[currentRegion]->numTiles) / (perilla::NUM_THREADS_PER_TEAM-perilla::NUM_COMM_THREADS-1) ); - else - totalItr = 1; - - currentItr = 1; - - currentTile = 0; - if(tiling) - for(currentTile = 0; 
currentTile < itrGraph->fabTiles[currentRegion]->numTiles; currentTile++) - if(currentTile % (perilla::NUM_THREADS_PER_TEAM-perilla::NUM_COMM_THREADS-1) == ntid/*-perilla::NUM_COMM_THREADS*/) - break; - } - else - { - } - } - else - { - if(!itrGraph->isGraphEmpty()) - { - if(haveDepGraph) - currentRegion = itrGraph->getAnyFireableRegion(*depGraph); - else - currentRegion = itrGraph->getAnyFireableRegion(); - - if(tiling) - totalItr = std::ceil( (1.0*itrGraph->fabTiles[currentRegion]->numTiles) / (perilla::NUM_THREADS_PER_TEAM-perilla::NUM_COMM_THREADS) ); - else - totalItr = 1; - - currentItr = 1; - - currentTile = 0; - if(tiling) - for(currentTile = 0; currentTile < itrGraph->fabTiles[currentRegion]->numTiles; currentTile++) - if(currentTile % (perilla::NUM_THREADS_PER_TEAM-perilla::NUM_COMM_THREADS) == ntid/*-perilla::NUM_COMM_THREADS*/) - break; - } - else - { - } - } - } - - //! Increment iterator to the next tile we own. - void RGIter::operator++ () - { - - currentItr++; - - if(tiling) - for( (currentTile == itrGraph->fabTiles[currentRegion]->numTiles ? currentTile : ++currentTile); currentTile < itrGraph->fabTiles[currentRegion]->numTiles; currentTile++) - { - if(implicit) - { - if(currentTile % (perilla::NUM_THREADS_PER_TEAM-perilla::NUM_COMM_THREADS-1) == ntid/*-perilla::NUM_COMM_THREADS*/) - break; - } - else - { - if(currentTile % (perilla::NUM_THREADS_PER_TEAM-perilla::NUM_COMM_THREADS) == ntid/*-perilla::NUM_COMM_THREADS*/) - break; - } - } - - int myProc = amrex::ParallelDescriptor::MyProc(); - - if( currentItr > totalItr )//&& currentTile == itrGraph->fabTiles[currentRegion]->numTiles) - { - //if(WorkerThread::isTeamMasterThread(tid) ) - //fout << "++B GEmpty " << itrGraph->isGraphEmpty(tg) << std::endl; - - //fout << "++B CmpReg isGE " << (implicit? itrGraph->isGraphEmptyV2(tg) : itrGraph->isGraphEmpty(tg)) << " CompleteQ "<< itrGraph->worker[tg]->nompletedRegionQueue->queueSize(true) << " totTasks " << itrGraph->worker[tg]->totalTasks << " FireQ "<< itrGraph->worker[tg]->fireableRegionQueue->queueSize(true) << " UnfireQ "<< itrGraph->worker[tg]->unfireableRegionQueue->queueSize(true) << std::endl; - - if(implicit) - itrGraph->regionComputed(currentRegion); - else - itrGraph->finalizeRegion(currentRegion); - - //if(WorkerThread::isTeamMasterThread(tid) ) - //fout << "++A GEmpty " << itrGraph->isGraphEmpty(tg) << std::endl; - - //fout << "++A CmpReg isGE " << (implicit? 
itrGraph->isGraphEmptyV2(tg) : itrGraph->isGraphEmpty(tg)) << " CompleteQ "<< itrGraph->worker[tg]->completedRegionQueue->queueSize(true) << " totTasks " << itrGraph->worker[tg]->totalTasks << " FireQ "<< itrGraph->worker[tg]->fireableRegionQueue->queueSize(true) << " UnfireQ "<< itrGraph->worker[tg]->unfireableRegionQueue->queueSize(true) << std::endl; - - if(implicit) - { - if(!itrGraph->isGraphEmptyV2()) - { - currentRegion = itrGraph->getPulledFireableRegion(); - if(tiling) - totalItr = std::ceil( (1.0*itrGraph->fabTiles[currentRegion]->numTiles) / (perilla::NUM_THREADS_PER_TEAM-perilla::NUM_COMM_THREADS-1) ); - else - totalItr = 1; - - currentItr = 1; - - currentTile = 0; - if(tiling) - for(currentTile = 0; currentTile < itrGraph->fabTiles[currentRegion]->numTiles; currentTile++) - if(currentTile % (perilla::NUM_THREADS_PER_TEAM-perilla::NUM_COMM_THREADS-1) == ntid/*-perilla::NUM_COMM_THREADS*/) - break; - } - else - { - //fout << "Graph is Empty" << std::endl; - //currentRegion = 0; - //currentTile = 0; - } - } - else - { - if(!itrGraph->isGraphEmpty()) - { -// double start_time_wtime = omp_get_wtime(); - - if(haveDepGraph) - currentRegion = itrGraph->getAnyFireableRegion(*depGraph); - else - currentRegion = itrGraph->getAnyFireableRegion(); - -// double end_time_wtime = omp_get_wtime(); -// getFireableTime += end_time_wtime - start_time_wtime; - - if(tiling) - totalItr = std::ceil( (1.0*itrGraph->fabTiles[currentRegion]->numTiles) / (perilla::NUM_THREADS_PER_TEAM-perilla::NUM_COMM_THREADS) ); - else - totalItr = 1; - - currentItr = 1; - - currentTile = 0; - if(tiling) - for(currentTile = 0; currentTile < itrGraph->fabTiles[currentRegion]->numTiles; currentTile++) - if(currentTile % (perilla::NUM_THREADS_PER_TEAM-perilla::NUM_COMM_THREADS) == ntid/*-perilla::NUM_COMM_THREADS*/) - break; - } - } - } - - //fout << "++E Region " << currentRegion << " Tile " << currentTile << " numTile "<< itrGraph->fabTiles[currentRegion]->numTiles <<" tid " << tid << " myP " << myProc <isGraphEmptyV2(); - if(valid) - do_remaining = false; - } - - if(do_remaining) - { - bool push = false; - - int f; - int level = m_level_afpi[iteration-1]->m_amrlevel.level; - double dt = m_level_afpi[iteration-1]->m_amrlevel.parent->dtLevel(level); - this->currentItr = 1; - this->totalItr = 1; - - while(!itrGraph->isGraphEmpty()) - { - f = itrGraph->worker[tg]->computedRegionQueue->getFrontRegion(true); - - if(push & level == m_level_afpi[iteration-1]->m_amrlevel.parent->finestLevel() && iteration < m_level_afpi[iteration-1]->m_amrlevel.parent->nCycle(level)) - m_level_afpi[iteration]->SendIntraLevel(this,boxGrow,time+dt,index,scomp,ncomp,iteration,f,false); - //else if(level == parent->finestLevel() && iteration == ncycle) - //SborderAFPI[0]->PushOnly(NUM_GROW, time+dt, State_Type, 0, NUM_STATE, f, tid, 0x02, 1); - - if(push & level < m_level_afpi[iteration-1]->m_amrlevel.parent->finestLevel()) - { - for(int i=0; i < m_level_afpi[iteration-1]->m_amrlevel.parent->nCycle(level+1); i++) - { - m_upper_level_afpi[i]->SendInterLevel(this,boxGrow,time+(i*m_level_afpi[iteration-1]->m_amrlevel.parent->dtLevel(level+1)),index,scomp,ncomp,i+1,f,false); - //upperLevel.SborderAFPI[i]->PushOnly(NUM_GROW, time+(i*parent->dtLevel(level+1)), State_Type, 0, NUM_STATE, f, tid, tuc, tempf, false); - } - } - - itrGraph->worker[tg]->barr->sync(perilla::NUM_THREADS_PER_TEAM-perilla::NUM_COMM_THREADS); - if(perilla::isMasterWorkerThread()) - { - f = itrGraph->worker[tg]->computedRegionQueue->removeRegion(); - 
itrGraph->worker[tg]->completedRegionQueue->addRegion(f,true); - } - } - - - //m_level_afpi[iteration-1]->destGraph->worker[tg]->barr->sync(perilla::NUM_THREADS_PER_TEAM-1); - if(perilla::isMasterWorkerThread()) - m_level_afpi[iteration-1]->completeRegionGraphs(); - valid = false; - } - } - else - { - if(itrGraph->isGraphEmpty()) - if(perilla::isMasterWorkerThread()) - { - itrGraph->finalizeRegionGraph(); - } - valid = !(itrGraph->isGraphEmpty()); - } - /* - itrGraph->worker[tg]->barr->sync(perilla::NUM_THREADS_PER_TEAM-1); - if(!isV && tg==0 && myProc==0) - if(WorkerThread::isTeamMasterThread(tid)) - fout << " M " <worker[tg]->barr->sync(perilla::NUM_THREADS_PER_TEAM-1); - */ - - /* - fout << "isValid Ending " << !(itrGraph->isGraphEmpty(tg)) << " tid " << tid <graphID != -1) - //Perilla::getAnyFRTimeSplit[itrGraph->graphID-1] += getFireableTime; - //if(myProc == 150 && itrGraph->graphID != -1) - //{ - // std::cout << "gID " << itrGraph->graphID << " getFRTime " << getFireableTime << std::endl; - //} - } - - return valid; - } - - amrex::Box RGIter::tileBox() - { - - int myProc = amrex::ParallelDescriptor::MyProc(); - //fout.open(std::to_string(myProc)+ "_" + std::to_string(tid) + ".txt", std::fstream::app); - - //fout << "nTls " << itrGraph->fabTiles[currentRegion]->numTiles << " cT " << currentTile << std::endl; - - if(currentTile == itrGraph->fabTiles[currentRegion]->numTiles) - //if( (currentTile % (perilla::NUM_THREADS_PER_TEAM-1) != ntid-1) ) - { - //fout << "invalidBox " << std::endl; - //fout.close(); - return amrex::Box(); - } - else - { - //fout << "validBox tBxSize " << itrGraph->fabTiles[currentRegion]->tileBx.size() << std::endl; - //fout.close(); - return *(itrGraph->fabTiles[currentRegion]->tileBx[currentTile]); - } - } - - amrex::Box RGIter::validBox() const - { - return *(itrGraph->fabTiles[currentRegion]->validBx); - } - - amrex::Box RGIter::tilebox() - { - return this->tileBox(); - } - - amrex::Box RGIter::growntilebox() - { - - } - - amrex::Box RGIter::growntilebox(int ng) - { - - Box bx = this->tileBox(); - if(currentTile == itrGraph->fabTiles[currentRegion]->numTiles) - return bx; - - if (ng < -100) ng = 0; - const Box& vbx = validBox(); - for (int d=0; dtileBox(); - bx.convert(typ); - const Box& vbx = this->validBox(); - const IntVect& Big = vbx.bigEnd(); - int d0, d1; - if (dir < 0) { - d0 = 0; - d1 = BL_SPACEDIM-1; - } else { - d0 = d1 = dir; - } - for (int d=d0; d<=d1; ++d) { - if (typ.cellCentered(d)) { // validbox should also be cell-centered in d-direction. 
- bx.surroundingNodes(d); - if (bx.bigEnd(d) <= Big[d]) { - bx.growHi(d,-1); - } - } - } - return bx; - } - - void RGIter::sync_workers() - { - - if(implicit) - itrGraph->worker[tg]->l_barr->sync(perilla::NUM_THREADS_PER_TEAM-perilla::NUM_COMM_THREADS-1); - else - itrGraph->worker[tg]->barr->sync(perilla::NUM_THREADS_PER_TEAM-perilla::NUM_COMM_THREADS); - - } -} diff --git a/Src/AmrTask/rts_impls/mpi_omp/RegionGraph.H b/Src/AmrTask/rts_impls/mpi_omp/RegionGraph.H deleted file mode 100755 index 2683e7bec57..00000000000 --- a/Src/AmrTask/rts_impls/mpi_omp/RegionGraph.H +++ /dev/null @@ -1,324 +0,0 @@ -#ifndef P_REGIONGRAPH_H -#define P_REGIONGRAPH_H - -#include -#include -#include -#include -#include -#include -#include -#include - -using namespace perilla; -#ifdef PERILLA_DEBUG -#include "PerillaMemCheck.H" -extern PerillaMemCheck memcheck; -#endif - -namespace amrex{ - - class RegionGraph; - - class FabCopyAssoc - { - public: - LocalConnection l_con; - RemoteConnection r_con; - FabCopyAssoc *next; - FabCopyAssoc *prev; - RegionGraph *graphPartner; - // CopyAssoc *orig_copyAssoc; - FabCopyAssoc() - { - next=0; - prev=0; - graphPartner=0; - } - ~FabCopyAssoc() - { - if(next) delete next; - } - }; - - class pTileArray - { - public: - int numTiles; - std::vector tileBx; - Box* validBx; - pTileArray(): numTiles(0), tileBx(0){} - ~pTileArray() - { - tileBx.clear(); - } - }; - - class Task - { - public: - std::vector state; - bool init; - FabCopyAssoc *cpAsc_srcHead; - FabCopyAssoc *cpAsc_dstHead; - - std::vector depTaskIDs; - int numDepTasksCompleted; - bool depTasksCompleted; - - Task() - { - state.reserve(16); - depTaskIDs.reserve(1024); - depTasksCompleted = true; - numDepTasksCompleted = 0; - cpAsc_srcHead=0; - cpAsc_dstHead=0; - } - - ~Task() - { - state.clear(); - depTaskIDs.clear(); - if(cpAsc_srcHead != 0) - delete[] cpAsc_srcHead; - if(cpAsc_dstHead != 0) - delete[] cpAsc_dstHead; - } - }; - - class Worker - { - public: - int totalTasks; - int computedTasks; - bool init; - Barrier* barr; - Barrier* l_barr; - RegionQueue* fireableRegionQueue; - RegionQueue* unfireableRegionQueue; - RegionQueue* computedRegionQueue; - RegionQueue* completedRegionQueue; - Worker():init(false), l_barr(0), barr(0), totalTasks(0){} - - ~Worker(){ - delete barr; - delete l_barr; - delete fireableRegionQueue; - delete unfireableRegionQueue; - delete computedRegionQueue; - delete completedRegionQueue; - } - }; - - //template - class CopyMap - { - public: - std::vector map; - CopyMap *next; - CopyMap() - : - next(0) - { -#ifdef PERILLA_DEBUG - memcheck.add(memcheck.genKey(this), (void*)this, "CopyMap"); -#endif - - } - - void alloc_CopyMap(const MultiFab& mf) - { - - Vector IndArr = mf.IndexArray(); - const int n = IndArr.size(); - //const int n = mf.size(); - map.reserve(n); - //sMap.resize(n); - for (int i = 0; i < n; ++i) - { - int K = IndArr[i]; - const Box& tmp = mf.fabbox(K); - map.push_back(new FArrayBox(tmp, mf.nComp(), false, true)); - } - } - ~CopyMap() - { - for (int i = 0; i < map.size(); ++i) - { - delete map[i]; - } - map.clear(); - if(next !=0 ) - delete next; -#ifdef PERILLA_DEBUG - memcheck.remove(memcheck.genKey(this)); -#endif - } - }; - - class RegionGraph - { - public: - static int graphCnt; - int graphID; - int numTasks; - int numFabs; - int totalFinishes; - bool isDepGraph; - bool* okToReset; - omp_lock_t finishLock; - - std::vector fabTiles; - std::vector fabTiles_gtbx; - - std::vector lMap; - std::vector sMap; - std::vector rMap; - CopyMap *sCopyMapHead; - CopyMap *rCopyMapHead; - - 
std::vector task; - std::vector worker; - - RegionGraph* srcLinkGraph; - - public: - RegionGraph(int numtasks); - void Initialize(); - void Reset(); - bool isGraphEmpty(); - bool isGraphEmptyV2(); - void finalizeGraph(); - void regionGraphReset(int numfabs); - void regionGraphMinReset(void); - void enableAllRegions(); - void disableRegion(int r, int tg); - void finalizeRegion(int r); - void finalizeRegionGraph(); - void regionComputed(int r); - bool isFireableRegion(int r); - int getAnyFireableRegion(); - int getAnyFireableRegion(RegionGraph& depGraph); - int getPulledFireableRegion(); - int getFireableRegion(bool isSingleThread=false); - void setFireableRegion(int r); - void graphTeardown(); - void workerTeardown(); - int size(){return task.size();} - - int getRegion(){ - return worker[perilla::wid()]->computedRegionQueue->getFrontRegion(true); - } - - void syncComputeWorkerThreads(){ - worker[perilla::wid()]->barr->sync(perilla::NUM_THREADS_PER_TEAM-1); - } - void syncComputeWorkerThreads(int numthreads){ - worker[perilla::wid()]->barr->sync(numthreads); - } - - void syncWorkerThreads(){ - worker[perilla::wid()]->barr->sync(perilla::NUM_THREADS_PER_TEAM-1); - } - void syncWorkerThreads(int numthreads){ - worker[perilla::wid()]->barr->sync(numthreads); - } - - void alloc_lMap(const MultiFab& mf) - { - const int n = mf.IndexArray().size(); - lMap.reserve(n); - for (int i = 0; i < n; ++i) - { - int K = mf.IndexArray()[i]; - const Box& tmp = mf.fabbox(K); - lMap.push_back(new FArrayBox(tmp, mf.nComp(), false, true)); - } - } - - void alloc_sMap(const MultiFab& mf) - { - const int n = mf.IndexArray().size(); - sMap.reserve(n); - for (int i = 0; i < n; ++i) - { - int K = mf.IndexArray()[i]; - const Box& tmp = mf.fabbox(K); - sMap.push_back(new FArrayBox(tmp, mf.nComp(), false, true)); - } - } - - void alloc_rMap(const MultiFab& mf) - { - const int n = mf.IndexArray().size(); - rMap.reserve(n); - for (int i = 0; i < n; ++i) - { - int K = mf.IndexArray()[i]; - const Box& tmp = mf.fabbox(K); - rMap.push_back(new FArrayBox(tmp, mf.nComp(), false, true)); - } - } - - void buildTileArray(const MultiFab& mf) - { - const int n = mf.IndexArray().size(); - fabTiles.resize(n); - - for (int i = 0; i < n; ++i) - { - fabTiles[i] = new pTileArray(); - } - for (MFIter mfi(mf, true); mfi.isValid(); ++mfi) - { - fabTiles[mfi.LocalIndex()]->numTiles++; - fabTiles[mfi.LocalIndex()]->tileBx.push_back(new Box(mfi.tilebox())); - fabTiles[mfi.LocalIndex()]->validBx = new Box(mfi.validbox()); - } - } - - void buildTileArray_gtbx(const MultiFab& mf, int ng) - { - const int n = mf.IndexArray().size(); - fabTiles_gtbx.resize(n); - - for (int i = 0; i < n; ++i) - { - fabTiles_gtbx[i] = new pTileArray(); - } - for (MFIter mfi(mf, true); mfi.isValid(); ++mfi) - { - fabTiles_gtbx[mfi.LocalIndex()]->numTiles++; - fabTiles_gtbx[mfi.LocalIndex()]->tileBx.push_back(new Box(mfi.growntilebox(ng))); - } - } - - void buildTileArray(const amrex::MultiFab& mf, const amrex::IntVect& tilesize) - { - int myProc = amrex::ParallelDescriptor::MyProc(); - const int n = mf.indexArray.size(); - fabTiles.resize(n); - - //typ = mf.boxArray().ixType(); - - for (int i = 0; i < n; ++i) - { - fabTiles[i] = new pTileArray(); - } - for (amrex::MFIter mfi(mf, tilesize); mfi.isValid(); ++mfi) - { - if( fabTiles[mfi.LocalIndex()]->numTiles == 0 ) - fabTiles[mfi.LocalIndex()]->validBx = new amrex::Box(mfi.validbox()); - fabTiles[mfi.LocalIndex()]->numTiles++; - fabTiles[mfi.LocalIndex()]->tileBx.push_back(new amrex::Box(mfi.tilebox())); - } - } - - - 
~RegionGraph(); - }; -}//end namespace - - -#endif diff --git a/Src/AmrTask/rts_impls/mpi_omp/RegionGraph.cpp b/Src/AmrTask/rts_impls/mpi_omp/RegionGraph.cpp deleted file mode 100755 index 895037152f8..00000000000 --- a/Src/AmrTask/rts_impls/mpi_omp/RegionGraph.cpp +++ /dev/null @@ -1,945 +0,0 @@ -#include -#include -#include -#include - -using namespace std; -using namespace amrex; -using namespace perilla; - -int RegionGraph::graphCnt = 0; - -RegionGraph::RegionGraph(int numtasks) -{ - sCopyMapHead = 0; - rCopyMapHead = 0; - srcLinkGraph = 0; - isDepGraph = false; - numFabs = numtasks; - numTasks = numtasks; - graphID = ++graphCnt; - worker.resize(perilla::NUM_THREAD_TEAMS); - task.resize(numTasks); - totalFinishes=0; - okToReset = new bool[perilla::NUM_THREAD_TEAMS]; - omp_init_lock(&finishLock); - Initialize(); -#ifdef PERILLA_DEBUG - memcheck.add(memcheck.genKey(this), (void*)this, "Package"); -#endif -} - -void RegionGraph::Initialize() -{ - int numfabs = numTasks; - int numthreads = omp_get_num_threads(); - - if(numthreads==1) - { -#pragma omp parallel shared(numfabs) - { - int tg = WorkerThread::perilla_wid(); - - if(WorkerThread::perilla_isMasterWorkerThread()) - { - worker[tg] = new Worker(); - worker[tg]->barr = new Barrier(perilla::NUM_THREADS_PER_TEAM-1); - worker[tg]->l_barr = new Barrier(perilla::NUM_THREADS_PER_TEAM-2); - if(numfabs <= perilla::TASK_QUEUE_DEFAULT_MAXSIZE) - { - worker[tg]->fireableRegionQueue = new RegionQueue(); - worker[tg]->unfireableRegionQueue = new RegionQueue(); - worker[tg]->computedRegionQueue = new RegionQueue(); - worker[tg]->completedRegionQueue = new RegionQueue(); - } - else - { - worker[tg]->fireableRegionQueue = new RegionQueue(numfabs); - worker[tg]->unfireableRegionQueue = new RegionQueue(numfabs); - worker[tg]->computedRegionQueue = new RegionQueue(numfabs); - worker[tg]->completedRegionQueue = new RegionQueue(numfabs); - } - worker[tg]->totalTasks = 0; - worker[tg]->computedTasks = 0; - for(int f=0; f < numfabs; f++) - if(WorkerThread::isMyRegion(tg,f)) - { - task[f] = new Task(); - worker[tg]->unfireableRegionQueue->addRegion(f); - worker[tg]->totalTasks++; - for(int i=0; i<16; i++) - task[f]->state[i] = 0; - task[f]->init = true; - } - worker[tg]->init = true; - okToReset[tg] = false; - } - }// omp parallel end - } - else // numthread are > 1, so already in parallel region - { - int tg = WorkerThread::perilla_wid(); - if(WorkerThread::perilla_isMasterWorkerThread() && worker[tg]->init == false ) - { - worker[tg]->barr = new Barrier(perilla::NUM_THREADS_PER_TEAM-1); - worker[tg]->l_barr = new Barrier(perilla::NUM_THREADS_PER_TEAM-2); - worker[tg]->fireableRegionQueue = new RegionQueue(); - worker[tg]->unfireableRegionQueue = new RegionQueue(); - worker[tg]->completedRegionQueue = new RegionQueue(); - worker[tg]->totalTasks = 0; - worker[tg]->computedTasks = 0; - for(int f=0; f < numfabs; f++) - if(WorkerThread::isMyRegion(tg,f)) - { - worker[tg]->unfireableRegionQueue->addRegion(f); - worker[tg]->totalTasks++; - for(int i=0; i<16; i++) - task[f]->state[i] = 0; - task[f]->init = true; - } - worker[tg]->init = true; - } - } -} - -void RegionGraph::Reset() -{ - int tg= perilla::wid(); - omp_set_lock(&finishLock); - if(okToReset[tg]) - totalFinishes--; - omp_unset_lock(&finishLock); - - if(okToReset[tg]) - { - worker[tg]->totalTasks = 0; - worker[tg]->computedTasks = 0; - while(worker[tg]->completedRegionQueue->queueSize(true) > 0) - { - int r = worker[tg]->completedRegionQueue->removeRegion(true); - if(WorkerThread::isMyRegion(tg, r)) - { 
- worker[tg]->unfireableRegionQueue->addRegion(r,true); - worker[tg]->totalTasks++; - for(int i=0; i<16; i++) - task[r]->state[i] = 0; - task[r]->init = true; - if(task[r]->depTaskIDs.size() > 0) - task[r]->depTasksCompleted = false; - } - else - break; - } - } -} - -bool RegionGraph::isGraphEmpty() -{ - int tg= perilla::wid(); - //worker[tg]->barr->sync(perilla::NUM_THREADS_PER_TEAM-1); - perilla::syncWorkerThreads(); - if(worker[tg]->completedRegionQueue->queueSize(true)== worker[tg]->totalTasks) - return true; - return false; -} - -bool RegionGraph::isGraphEmptyV2() -{ - int tg=perilla::wid(); - - if(worker[tg]->completedRegionQueue->queueSize(true) == worker[tg]->totalTasks || worker[tg]->computedTasks == worker[tg]->totalTasks) - return true; - return false; -} - -void RegionGraph::finalizeGraph() -{ - omp_set_lock(&finishLock); - totalFinishes++; - int tg=perilla::wid(); - okToReset[tg]=true; - omp_unset_lock(&finishLock); -} - -void RegionGraph::regionGraphReset(int numfabs) -{ - int nt; - int tg; - int r; - //#pragma omp parallel private(r,tg,nt,tid) shared(numfabs) - { - tg = perilla::wid(); - nt = perilla::wtid(); - if(perilla::isMasterThread()) - totalFinishes=0; - //#pragma omp barrier - if(perilla::isMasterWorkerThread()) - { - worker[tg]->totalTasks = 0; - worker[tg]->computedTasks = 0; - while(worker[tg]->completedRegionQueue->queueSize(true) > 0) - { - r = worker[tg]->completedRegionQueue->removeRegion(true); - if(WorkerThread::isMyRegion(tg, r)) - { - worker[tg]->unfireableRegionQueue->addRegion(r,true); - worker[tg]->totalTasks++; - for(int i=0; i<16; i++) - task[r]->state[i] = 0; - task[r]->init = true; - } - else - break; - } - okToReset[tg] = false; - } - }// omp parallel end -} - - -void RegionGraph::regionGraphMinReset(void) -{ - int nt; - int tg; - int r; - { - tg = perilla::wid(); - nt = perilla::wtid(); - if(perilla::isMasterThread()) - totalFinishes=0; - if(perilla::isMasterWorkerThread()) - { - while(worker[tg]->completedRegionQueue->queueSize(true) > 0) - { - r = worker[tg]->completedRegionQueue->removeRegion(true); - if(WorkerThread::isMyRegion(tg, r)) - { - worker[tg]->unfireableRegionQueue->addRegion(r,true); - } - else - break; - } - okToReset[tg] = false; - } - } -} - - -void RegionGraph::enableAllRegions() -{ - int numfabs = numTasks; - int r; - int tg = WorkerThread::perilla_wid(); - perilla::syncWorkerThreads(); - if(perilla::isMasterWorkerThread()) - for(int f=0; funfireableRegionQueue->removeRegion(true); - worker[tg]->fireableRegionQueue->addRegion(r,true); - } - //worker[tg]->barr->sync(perilla::NUM_THREADS_PER_TEAM-1); // Barrier to synchronize team threads - perilla::syncWorkerThreads(); -} - -void RegionGraph::disableRegion(int r, int tg) -{ - //int tg = perilla::wid(); - if(perilla::isMasterWorkerThread()) - if(WorkerThread::isMyRegion(tg, r)) - { - int rID = worker[tg]->fireableRegionQueue->removeRegion(true); - worker[tg]->unfireableRegionQueue->addRegion(rID,true); - } -} - -void RegionGraph::regionComputed(int r) -{ - int tg= perilla::wid(); - worker[tg]->l_barr->sync(perilla::NUM_THREADS_PER_TEAM-2); - if(perilla::isMasterWorkerThread()) - if(WorkerThread::isMyRegion(tg, r)) - { - int rr = worker[tg]->fireableRegionQueue->removeRegion(); - if(r != rr) - { - std::cout << "ERROR: In computedeRegion" << std::endl; - exit(EXIT_FAILURE); - } - worker[tg]->computedRegionQueue->addRegion(rr); - worker[tg]->computedTasks++; - } - worker[tg]->l_barr->sync(perilla::NUM_THREADS_PER_TEAM-2); -} - -void RegionGraph::finalizeRegion(int r) -{ - int tg= 
perilla::wid(); - int ntid=perilla::wtid(); - perilla::syncWorkerThreads(); - if(perilla::isMasterWorkerThread()) - if(WorkerThread::isMyRegion(tg, r)) - { - int rr = worker[tg]->fireableRegionQueue->removeRegion(true); - if(r != rr) - { - std::cout << "ERROR: In completeRegion" << std::endl; - exit(EXIT_FAILURE); - } - worker[tg]->completedRegionQueue->addRegion(rr,true); - } - perilla::syncWorkerThreads(); -} - -void RegionGraph::finalizeRegionGraph() -{ - int tg= perilla::wid(); - omp_set_lock(&finishLock); - totalFinishes++; - okToReset[tg]=true; - omp_unset_lock(&finishLock); -} - -bool RegionGraph::isFireableRegion(int r) -{ - int myProc = ParallelDescriptor::MyProc(); - FabCopyAssoc *cpDst = task[r]->cpAsc_dstHead; - if(lMap.size() > 0) - if(lMap[r]->l_con.firingRuleCnt != lMap[r]->l_con.ndcpy) - { - return false; - } - while(cpDst != 0) - { - if(cpDst->l_con.firingRuleCnt != cpDst->l_con.ndcpy) - { - return false; - } - cpDst = cpDst->next; - } - - if(srcLinkGraph != 0) - { - if(!task[r]->depTasksCompleted) - { - for(int i=0; idepTaskIDs.size(); i++) - if(!srcLinkGraph->isFireableRegion(task[r]->depTaskIDs[i])) - return false; - task[r]->depTasksCompleted = true; - } - } - - if(ParallelDescriptor::NProcs() == 1) return true; - - if(lMap.size() > 0) - if(lMap[r]->r_con.firingRuleCnt != lMap[r]->r_con.nrcv) - { - return false; - } - - cpDst = task[r]->cpAsc_dstHead; - while(cpDst != 0) - { - if(cpDst->r_con.firingRuleCnt != cpDst->r_con.nrcv) - { - return false; - } - cpDst = cpDst->next; - } - return true; -} - -int RegionGraph::getFireableRegion(bool isSingleThread) -{ - int r = -1; - bool fireable; - int tg= perilla::wid(); - - if(worker[tg]->unfireableRegionQueue->queueSize(true)!=0 && worker[tg]->fireableRegionQueue->queueSize() == 0) - { - fireable = false; - r = worker[tg]->unfireableRegionQueue->removeRegion(true); - while(!fireable) - { - fireable = isFireableRegion(r); - if(!fireable) - { - worker[tg]->unfireableRegionQueue->addRegion(r,true); - r = worker[tg]->unfireableRegionQueue->removeRegion(true); - } - } - } - else if(worker[tg]->unfireableRegionQueue->queueSize(true)!=0) - { - int unfQsize = worker[tg]->unfireableRegionQueue->queueSize(true); - for(int i = 0; i < unfQsize; i++) - { - int tr = worker[tg]->unfireableRegionQueue->removeRegion(true); - if(isFireableRegion(tr)) - { - r = tr; - break; - } - else - worker[tg]->unfireableRegionQueue->addRegion(tr,true); - } - } - - return r; -} - -#if 0 -int RegionGraph::getFireableRegion(bool patchFilled, bool isSingleThread) -{ - int r = -1; - bool fireable; - int tg= perilla::wid(); - int nt= perilla::wtid(); - - //if(worker[tg]->unfireableRegionQueue->queueSize(true)!=0 && worker[tg]->fireableRegionQueue->queueSize() == 0) - //{ - if(!isSingleThread)worker[tg]->barr->sync(perilla::NUM_THREADS_PER_TEAM-1); // Barrier to synchronize team threads - if(perilla::isMasterWorkerThread()) - { - if(worker[tg]->fireableRegionQueue->queueSize()==0){ - fireable = false; - assert(worker[tg]->unfireableRegionQueue->queueSize()>0); - r = worker[tg]->unfireableRegionQueue->removeRegion(true); - while(!fireable) - { - fireable = isFireableRegion(r, patchFilled); - //fireable = true; - if(!fireable) - { - worker[tg]->unfireableRegionQueue->addRegion(r,true); - r = worker[tg]->unfireableRegionQueue->removeRegion(true); - } - else worker[tg]->fireableRegionQueue->addRegion(r,true); - } - } - } -#if 0 - else if(worker[tg]->unfireableRegionQueue->queueSize(true)!=0) - { - int unfQsize = worker[tg]->unfireableRegionQueue->queueSize(true); - 
for(int i = 0; i < unfQsize; i++) - { - int tr = worker[tg]->unfireableRegionQueue->removeRegion(true); - if(isFireableRegion(tr)) - { - r = tr; - break; - } - else - worker[tg]->unfireableRegionQueue->addRegion(tr,true); - } - } -#endif - if(!isSingleThread)worker[tg]->barr->sync(perilla::NUM_THREADS_PER_TEAM-1); // Barrier to synchronize team threads - std::cout<<"FOUND A REGION"<fireableRegionQueue->getFrontRegion(true); - return r; -} -#endif - - - -#if 0 -int RegionGraph::getFireableRegion(bool patchFilled) -{ - int r = -1; - bool fireable; - int tg= perilla::wid(); - int nt= perilla::wtid(); - - //if(worker[tg]->unfireableRegionQueue->queueSize(true)!=0 && worker[tg]->fireableRegionQueue->queueSize() == 0) - //{ - worker[tg]->barr->sync(); // Barrier to synchronize team threads - if(nt == 0 && worker[tg]->fireableRegionQueue->queueSize()==0){ - fireable = false; - assert(worker[tg]->unfireableRegionQueue->queueSize()>0); - r = worker[tg]->unfireableRegionQueue->removeRegion(true); - while(!fireable) - { - fireable = isFireableRegion(r, patchFilled); - //fireable = true; - if(!fireable) - { - worker[tg]->unfireableRegionQueue->addRegion(r,true); - r = worker[tg]->unfireableRegionQueue->removeRegion(true); - } - else worker[tg]->fireableRegionQueue->addRegion(r,true); - } - } -#if 0 - else if(worker[tg]->unfireableRegionQueue->queueSize(true)!=0) - { - int unfQsize = worker[tg]->unfireableRegionQueue->queueSize(true); - for(int i = 0; i < unfQsize; i++) - { - int tr = worker[tg]->unfireableRegionQueue->removeRegion(true); - if(isFireableRegion(tr)) - { - r = tr; - break; - } - else - worker[tg]->unfireableRegionQueue->addRegion(tr,true); - } - } -#endif - worker[tg]->barr->sync(); // Barrier to synchronize team threads - r = worker[tg]->fireableRegionQueue->getFrontRegion(true); - return r; -} -#endif - -void RegionGraph::setFireableRegion(int r) -{ - worker[perilla::wid()]->fireableRegionQueue->addRegion(r); -} - - -int RegionGraph::getAnyFireableRegion() -{ - int myProc = ParallelDescriptor::MyProc(); - int tg = perilla::wid(); - int nt = perilla::wtid(); - int r; - perilla::syncWorkerThreads(); - if(nt ==0) - if(worker[tg]->fireableRegionQueue->queueSize()==0) - { - bool fireable = false; - r = worker[tg]->unfireableRegionQueue->removeRegion(true); - while(!fireable) - { - fireable = isFireableRegion(r); - if(!fireable) - { - worker[tg]->unfireableRegionQueue->addRegion(r,true); - r = worker[tg]->unfireableRegionQueue->removeRegion(true); - } - else - worker[tg]->fireableRegionQueue->addRegion(r,true); - } - } - perilla::syncWorkerThreads(); - return worker[tg]->fireableRegionQueue->getFrontRegion(true); -} - -int RegionGraph::getAnyFireableRegion(RegionGraph& depGraph) -{ - int nt; - int tg; - int r; - bool fireable; - - int myProc = amrex::ParallelDescriptor::MyProc(); - - tg = perilla::wid(); - nt = perilla::wtid(); - if(nt == perilla::NUM_COMM_THREADS && worker[tg]->fireableRegionQueue->queueSize()==0) - { - fireable = false; - r = worker[tg]->unfireableRegionQueue->removeRegion(true); - while(!fireable) - { - fireable = isFireableRegion(r); - fireable &= depGraph.isFireableRegion(r); - if(!fireable) - { - worker[tg]->unfireableRegionQueue->addRegion(r,true); - r = worker[tg]->unfireableRegionQueue->removeRegion(true); - } - else - worker[tg]->fireableRegionQueue->addRegion(r,true); - } - } - worker[tg]->barr->sync(); - //worker[tg]->barr->sync(perilla::NUM_THREADS_PER_TEAM-perilla::NUM_COMM_THREADS); // Barrier to synchronize team threads - r = 
worker[tg]->fireableRegionQueue->getFrontRegion(true); - return r; -} - - -int RegionGraph::getPulledFireableRegion() -{ - int myProc = ParallelDescriptor::MyProc(); - int tg = WorkerThread::perilla_wid(); - int nt = WorkerThread::perilla_wtid(); - if(nt == 0 && worker[tg]->fireableRegionQueue->queueSize()==0) - { - while(worker[tg]->fireableRegionQueue->queueSize()==0); - } - worker[tg]->l_barr->sync(perilla::NUM_THREADS_PER_TEAM-2); - return worker[tg]->fireableRegionQueue->getFrontRegion(true); -} - -void RegionGraph::graphTeardown() -{ - MPI_Status status; - Package* package; - int numfabs = numTasks; - int tg = WorkerThread::perilla_wid(); - -#if 0 - for(int f=0; fcpAsc_dstHead; - while(cpDst != 0) - { - cpDst->l_con.firingRuleCnt = 0; - - for(int i=0; il_con.ndcpy; i++) - { - while(cpDst->l_con.dcpy[i].pQueue.queueSize() >= 1) - { - package = cpDst->l_con.dcpy[i].pQueue.dequeue(); - //package->completed = false; - //package->served = false; - //package->notified = false; - //package->request = MPI_REQUEST_NULL; - cpDst->l_con.dcpy[i].recycleQueue.enqueue(package); - } - } - - cpDst = cpDst->next; - } - } - } - - - for(int f=0; fcpAsc_srcHead; - while(cpSrc != 0) - { - //cpSrc->l_con.firingRuleCnt = 0; - - for(int i=0; il_con.nscpy; i++) - { - while(cpSrc->l_con.scpy[i].pQueue.queueSize() >= 1) - { - package = cpSrc->l_con.scpy[i].pQueue.dequeue(); - - FabCopyAssoc* cpDst = cpSrc->graphPartner->task[cpSrc->l_con.scpy[i].nd]->cpAsc_dstHead; - while(cpDst != 0) - { - if(cpDst->graphPartner == this) //graphArray[g]) - break; - cpDst = cpDst->next; - } - //Package* sPackage = cpSrc->l_con.scpy[i].pQueue.dequeue(true); - omp_set_lock(&(cpDst->l_con.dLock)); - int dPartner = cpSrc->l_con.scpy[i].dPartner; - Package* dPackage = cpDst->l_con.dcpy[dPartner].recycleQueue.dequeue(true); - /* - for(int j=0; jbufSize; j++) - { - dPackage->databuf[j] = sPackage->databuf[j]; - } - */ - std::memcpy(dPackage->databuf, package->databuf, dPackage->bufSize * sizeof(double)); - //std::swap(dPackage->databuf, sPackage->databuf); - - cpDst->l_con.dcpy[dPartner].pQueue.enqueue(dPackage,true); - if(cpDst->l_con.dcpy[dPartner].pQueue.queueSize(true) == 1) - cpDst->l_con.firingRuleCnt++; - omp_unset_lock(&(cpDst->l_con.dLock)); - //cpSrc->l_con.scpy[i].recycleQueue.enqueue(sPackage,true); - - //package->completed = false; - //package->served = false; - //package->notified = false; - //package->request = MPI_REQUEST_NULL; - cpSrc->l_con.scpy[i].recycleQueue.enqueue(package); - } - } - - cpSrc = cpSrc->next; - } - } - } - - - - for(int f=0; f 0) - { - lMap[f]->l_con.firingRuleCnt = 0; - } - } - } -#endif - - if(ParallelDescriptor::NProcs() == 1) return; - - - - for(int f=0; fcpAsc_dstHead; - while(cpDst != 0) - { - cpDst->r_con.firingRuleCnt = 0; - for(int i=0; ir_con.nrcv; i++) - { - while(cpDst->r_con.rcv[i].pQueue.queueSize() >= 1) - { - package = cpDst->r_con.rcv[i].pQueue.dequeue(); - package->completed = false; - package->served = false; - package->notified = false; - package->request = MPI_REQUEST_NULL; - cpDst->r_con.rcv[i].recycleQueue.enqueue(package); - } - } - - cpDst = cpDst->next; - } - } - } - - - for(int f=0; fcpAsc_srcHead; - while(cpSrc != 0) - { - //cpSrc->r_con.firingRuleCnt = 0; - for(int i=0; ir_con.nsnd; i++) - { - while(cpSrc->r_con.snd[i].pQueue.queueSize() >= 1) - { - package = cpSrc->r_con.snd[i].pQueue.dequeue(); - package->completed = false; - package->served = false; - package->notified = false; - package->request = MPI_REQUEST_NULL; - 
cpSrc->r_con.snd[i].recycleQueue.enqueue(package); - } - } - - cpSrc = cpSrc->next; - } - } - } - - -#if 0 - if(tg == 0) - { - CopyMap* cpDst = rCopyMapHead; - while(cpDst != 0) - { - for(int f=0; fmap.size(); f++) - { - cpDst->map[f]->r_con.firingRuleCnt = 0; - for(int i=0; imap[f]->r_con.nrcv; i++) - { - while(cpDst->map[f]->r_con.rcv[i].pQueue.queueSize() >= 1) - { - package = cpDst->map[f]->r_con.rcv[i].pQueue.dequeue(); - if(package->request != MPI_REQUEST_NULL) - MPI_Cancel( &(package->request) ); - package->completed = false; - package->served = false; - package->notified = false; - package->request = MPI_REQUEST_NULL; - cpDst->map[f]->r_con.rcv[i].recycleQueue.enqueue(package); - } - } - - } - - cpDst = cpDst->next; - } - - - CopyMap* cpSrc = sCopyMapHead; - while(cpSrc != 0) - { - for(int f=0; fmap.size(); f++) - { - for(int i=0; imap[f]->r_con.nsnd; i++) - { - while(cpSrc->map[f]->r_con.snd[i].pQueue.queueSize() >= 1) - { - - package = cpSrc->map[f]->r_con.snd[i].pQueue.dequeue(); - /* - int ns = cpSrc->map[f]->r_con.snd[i].ns; - int nd = cpSrc->map[f]->r_con.snd[i].nd; - int r_gid = cpSrc->map[f]->r_con.snd[i].r_gid; - int r_grids = cpSrc->map[f]->r_con.snd[i].r_grids; - //int tag = tagGen(ns, nd, r_gid-1, np*r_grids, nGraphs); - int tag = Perilla::myTagMap[r_gid][nd][ns][cpSrc->map[f]->r_con.snd[i].sz]; - - Package* sPackage = lMap[f]->r_con.snd[i].pQueue.getFront(true); - package->request = ParallelDescriptor::Asend(sPackage->databuf, - cpSrc->map[f]->r_con.snd[i].sz, - cpSrc->map[f]->r_con.snd[i].pr, tag).req(); // tag == SeqNum in c++ ver - - */ - MPI_Wait( &(package->request), &status ); - package->completed = false; - package->served = false; - package->notified = false; - package->request = MPI_REQUEST_NULL; - cpSrc->map[f]->r_con.snd[i].recycleQueue.enqueue(package); - } - } - - } - - cpSrc = cpSrc->next; - } - } - - //if(WorkerThread::isTeamMasterThread(tid)) commented out b/c its already call by single thread in a team - //Perilla::globalBarrier->sync(perilla::NUM_THREAD_TEAMS); - - // Parallel Copy Reset on Local tg - for(int f=0; f 0) - { - lMap[f]->r_con.firingRuleCnt = 0; - - for(int i=0; ir_con.nsnd; i++) - while(lMap[f]->r_con.snd[i].pQueue.queueSize() >= 1) - { - package = lMap[f]->r_con.snd[i].pQueue.dequeue(); - package->completed = false; - package->served = false; - package->notified = false; - package->request = MPI_REQUEST_NULL; - lMap[f]->r_con.snd[i].recycleQueue.enqueue(package); - } - - for(int i=0; ir_con.nrcv; i++) - while(lMap[f]->r_con.rcv[i].pQueue.queueSize() >= 1) - { - package = lMap[f]->r_con.rcv[i].pQueue.dequeue(); - package->completed = false; - package->served = false; - package->notified = false; - package->request = MPI_REQUEST_NULL; - lMap[f]->r_con.rcv[i].recycleQueue.enqueue(package); - } - } - } - } - - // Fill boundary reset on local tg - if(tg == 0) - { - for(int f=0; f 0) - { - // if(WorkerThread::isMyRegion(tg,f)) - { - for(int i=0; i< rMap[f]->r_con.nrcv; i++) - while( rMap[f]->r_con.rcv[i].pQueue.queueSize() >= 1) - { - package = rMap[f]->r_con.rcv[i].pQueue.dequeue(); - if(package->request != MPI_REQUEST_NULL) - MPI_Cancel( &(package->request) ); - package->completed = false; - package->served = false; - package->notified = false; - package->request = MPI_REQUEST_NULL; - rMap[f]->r_con.rcv[i].recycleQueue.enqueue(package); - } - for(int i=0; i< sMap[f]->r_con.nsnd; i++) - while( sMap[f]->r_con.snd[i].pQueue.queueSize() >= 1) - { - package = sMap[f]->r_con.snd[i].pQueue.dequeue(); - MPI_Wait( &(package->request), &status ); - 
package->completed = false; - package->served = false; - package->notified = false; - package->request = MPI_REQUEST_NULL; - sMap[f]->r_con.snd[i].recycleQueue.enqueue(package); - } - } - } - } - } -#endif - -} - -void RegionGraph::workerTeardown() -{ - int numfabs = numTasks; - Package* package; - - regionGraphMinReset(); -} - -RegionGraph::~RegionGraph() -{ - delete[] okToReset; - for(int tg=0; tg -#include - -//////////////////////// class RegionQueue Declaration Start ///////////////////////////////////// -class RegionQueue -{ -private: - int* buffer; - int n; - int front; - int rear; - int max_size; - omp_lock_t queueLock; -public: - RegionQueue(); - RegionQueue(int numTasks); - ~RegionQueue(); - void addRegion(int r); - void addRegion(int r, bool lockIgnore); - int removeRegion(); - int removeRegion(bool lockIgnore); - int getFrontRegion(); - int getFrontRegion(bool lockIgnore); - int queueSize(bool lockIgnore); - int queueSize(); - void reallocate(); -}; -//////////////////////// class RegionQueue Declaration End ///////////////////////////////////// - - -#endif diff --git a/Src/AmrTask/rts_impls/mpi_omp/RegionQueue.cpp b/Src/AmrTask/rts_impls/mpi_omp/RegionQueue.cpp deleted file mode 100755 index 14a72c79138..00000000000 --- a/Src/AmrTask/rts_impls/mpi_omp/RegionQueue.cpp +++ /dev/null @@ -1,101 +0,0 @@ -#include -#include -#include -#include - -//////////////////////// class RegionQueue Definition Start ///////////////////////////////////// - RegionQueue::RegionQueue(void) - { - max_size= perilla::TASK_QUEUE_DEFAULT_MAXSIZE; - buffer = new int[max_size]; - n = 0; - front = 0; - rear = 0; - omp_init_lock(&queueLock); - } - - RegionQueue::RegionQueue(int numTasks) - { - buffer = new int[numTasks]; - n = 0; - max_size = numTasks; - front = 0; - rear = 0; - omp_init_lock(&queueLock); - } - - RegionQueue::~RegionQueue() - { - delete[] buffer; - } - - void RegionQueue::addRegion(int r) - { - omp_set_lock(&queueLock); - buffer[rear] = r; - rear = (rear+1)%max_size; - n++; - omp_unset_lock(&queueLock); - } - - void RegionQueue::addRegion(int r, bool lockIgnore) - { - if(!lockIgnore)omp_set_lock(&queueLock); - buffer[rear] = r; - rear = (rear+1)%max_size; - n++; - if(!lockIgnore)omp_unset_lock(&queueLock); - } - - int RegionQueue::removeRegion() - { - int r; - omp_set_lock(&queueLock); - r = buffer[front]; - front = (front+1)%max_size; - n--; - omp_unset_lock(&queueLock); - return r; - } - - int RegionQueue::removeRegion(bool lockIgnore) - { - int r; - if(!lockIgnore)omp_set_lock(&queueLock); - r = buffer[front]; - front = (front+1)%max_size; - n--; - if(!lockIgnore)omp_unset_lock(&queueLock); - return r; - } - - int RegionQueue::getFrontRegion() - { - return buffer[front]; - } - - int RegionQueue::getFrontRegion(bool lockIgnore) - { - if(!lockIgnore)omp_set_lock(&queueLock); - return buffer[front]; - if(!lockIgnore)omp_unset_lock(&queueLock); - } - - int RegionQueue::queueSize() - { - int size; - omp_set_lock(&queueLock); - size = n; - omp_unset_lock(&queueLock); - return size; - } - - int RegionQueue::queueSize(bool lockIgnore) - { - int size; - if(!lockIgnore)omp_set_lock(&queueLock); - size = n; - if(!lockIgnore)omp_unset_lock(&queueLock); - return size; - } -//////////////////////// class RegionQueue Definition End ///////////////////////////////////// diff --git a/Src/AmrTask/rts_impls/mpi_omp/RemoteConnection.H b/Src/AmrTask/rts_impls/mpi_omp/RemoteConnection.H deleted file mode 100755 index 47c16dac9bf..00000000000 --- a/Src/AmrTask/rts_impls/mpi_omp/RemoteConnection.H +++ 
/dev/null @@ -1,95 +0,0 @@ -#ifndef P_REMOTECONNECTION_H -#define P_REMOTECONNECTION_H - -#include -#include -#include - -using namespace perilla; -#ifdef PERILLA_DEBUG -#include "PerillaMemCheck.H" -extern PerillaMemCheck memcheck; -#endif - -class RemoteCommDescriptor -{ -public: - int ns, lns; // ! Source box in layout - int nd, lnd; //! Destination box in layout - int r_gid; - int r_grids; - int sz, pr; - Box sbx; // ! Sub-box for this copy - Box dbx; // ! Sub-box for this copy - PackageQueue pQueue; // !store incoming or outgoing messages, both fab and the runtime can access this queue - PackageQueue recycleQueue; //!store used messages, only fab can access this queue, no lock is required - int cnt; - RemoteCommDescriptor() : - ns(-1), lns(-1), - nd(-1), lnd(-1), - sz(0), pr(0), - cnt(0), r_gid(0), - r_grids(0) - { -#ifdef PERILLA_DEBUG - memcheck.add(memcheck.genKey(this), (void*)this, "RemoteCommDescriptor"); -#endif - } - ~RemoteCommDescriptor(){ -#ifdef PERILLA_DEBUG - memcheck.remove(memcheck.genKey(this)); -#endif - } -}; - -class TransDescriptor -{ - int sz, pv, pr; -}; - -class RemoteConnection -{ -public: - int nsnd; - int nrcv; - bool remotePushReady; - bool remotePullDone; - int nrp, nsp; - omp_lock_t *sndLock, *rcvLock, *ghostLock; - int firingRuleCnt; - RemoteCommDescriptor *snd; - RemoteCommDescriptor *rcv; - TransDescriptor *str; - TransDescriptor *rtr; - RemoteConnection() : - nsnd(0), - nrcv(0), - remotePushReady(false), - remotePullDone(false), - nrp(0), nsp(0), - firingRuleCnt(0), - snd(NULL), rcv(NULL), - str(NULL), rtr(NULL) - { - sndLock = new omp_lock_t; - rcvLock = new omp_lock_t; - ghostLock = new omp_lock_t; - omp_init_lock(sndLock); - omp_init_lock(rcvLock); - omp_init_lock(ghostLock); - } - - ~RemoteConnection() - { - if(snd) - delete[] snd; - if(rcv) - delete[] rcv; - delete sndLock; - delete rcvLock; - delete ghostLock; - } -}; - - -#endif diff --git a/Src/AmrTask/rts_impls/mpi_omp/WorkerThread.H b/Src/AmrTask/rts_impls/mpi_omp/WorkerThread.H deleted file mode 100755 index 449ab0f096e..00000000000 --- a/Src/AmrTask/rts_impls/mpi_omp/WorkerThread.H +++ /dev/null @@ -1,73 +0,0 @@ -#ifndef P_WORKERTHREAD_H -#define P_WORKERTHREAD_H - -#include -#include -#include - -namespace perilla{ - - class WorkerThread - { - static void* team_shared_memory[perilla::NUM_THREAD_TEAMS]; - int tid; - public: - static void init(); - static Barrier *globalBarrier; - static Barrier localBarriers[perilla::NUM_THREAD_TEAMS]; - static int perilla_tid(); - static int perilla_wtid(); - static int perilla_wid(); - static int perilla_nWorkerThreads(); - static int perilla_nWorkers(); - static int perilla_nTeamThreads(); - static bool perilla_isMasterWorkerThread(); - static bool perilla_isMasterThread(); - static bool perilla_isCommunicationThread(); - static bool isMyRegion(int workerID, int regionID); - static void setTeamSharedMemory(void* dummy, int tid, int tg); - static void* getTeamSharedMemory(int tg); - static void syncWorkers(); - static void syncThreads(); - static void syncComputeThreads(); - static void syncTeamThreads(); - static void syncAllThreads(); - static void syncAllComputeThreads(); - static void syncWorkerThreads(); - static void syncWorkerThreads(int numthreads); - static void syncComputeWorkerThreads(); - static void syncComputeWorkerThreads(int numthreads); - }; - - static int tid(){return WorkerThread::perilla_tid();} - static int wtid(){return WorkerThread::perilla_wtid();} - static int wid(){return WorkerThread::perilla_wid();} - static int 
nWorkerThreads(){return WorkerThread::perilla_nWorkerThreads();} - static int nWorkers(){return WorkerThread::perilla_nWorkers();} - static int nThreads(){return perilla::NUM_THREAD_TEAMS*perilla::NUM_THREADS_PER_TEAM;} - static bool isMasterWorkerThread(){return WorkerThread::perilla_isMasterWorkerThread();} - static bool isMasterThread(){return WorkerThread::perilla_isMasterThread();} - static bool isCommunicationThread(){return WorkerThread::perilla_isCommunicationThread();} - static bool isMyRegion(int workerID, int regionID){return WorkerThread::isMyRegion(workerID, regionID);} - static void setTeamSharedMemory(void* dummy, int tid, int tg){WorkerThread::setTeamSharedMemory(dummy, tid, tg);} - static void* getTeamSharedMemory(int tg){WorkerThread::getTeamSharedMemory(tg);} - static void syncWorkers(){WorkerThread::syncWorkers();} - static void syncThreads(){WorkerThread::syncThreads();} - static void syncComputeThreads(){WorkerThread::syncComputeThreads();} - static void syncComputeWorkerThreads(){WorkerThread::syncComputeWorkerThreads();} - static void syncComputeWorkerThreads(int numthreads){WorkerThread::syncComputeWorkerThreads(numthreads);} - static void syncWorkerThreads(){WorkerThread::syncWorkerThreads();} - static void syncWorkerThreads(int numthreads){WorkerThread::syncWorkerThreads(numthreads);} - static void syncAllWorkerThreads(){ - perilla::syncWorkerThreads(); - perilla::syncWorkers(); - } - static void syncAllComputeThreads(){ - perilla::syncAllComputeThreads(); - } - static void syncAllThreads(){ - WorkerThread::syncAllThreads(); - } -}//end namespace - -#endif diff --git a/Src/AmrTask/rts_impls/mpi_omp/WorkerThread.cpp b/Src/AmrTask/rts_impls/mpi_omp/WorkerThread.cpp deleted file mode 100755 index 5609740ef3a..00000000000 --- a/Src/AmrTask/rts_impls/mpi_omp/WorkerThread.cpp +++ /dev/null @@ -1,114 +0,0 @@ -#include -#include -#include -#include - -namespace perilla -{ - void* WorkerThread::team_shared_memory[perilla::NUM_THREAD_TEAMS]; - Barrier* WorkerThread::globalBarrier; - Barrier WorkerThread::localBarriers[perilla::NUM_THREAD_TEAMS]; - - void WorkerThread::init(){ - WorkerThread::globalBarrier= new Barrier(perilla::NUM_THREAD_TEAMS); - } - - void WorkerThread::syncWorkers(){ - if(isMasterWorkerThread()) WorkerThread::globalBarrier->sync(perilla::NUM_THREAD_TEAMS); - } - - void WorkerThread::syncTeamThreads(){ - WorkerThread::localBarriers[perilla_wid()].sync(perilla::NUM_THREADS_PER_TEAM); - } - - void WorkerThread::syncWorkerThreads(){ - WorkerThread::localBarriers[perilla_wid()].sync(perilla::NUM_THREADS_PER_TEAM-1); - } - void WorkerThread::syncWorkerThreads(int numthreads){ - WorkerThread::localBarriers[perilla_wid()].sync(numthreads); - } - - void WorkerThread::syncAllComputeThreads(){ - syncWorkerThreads(); - syncWorkers(); - } - - void WorkerThread::syncAllThreads(){ - #pragma omp barrier - } - - void WorkerThread::syncThreads(){ - syncWorkerThreads(); - syncWorkers; - } - - void WorkerThread::syncComputeWorkerThreads(){ - WorkerThread::localBarriers[perilla_wid()].sync(perilla::NUM_THREADS_PER_TEAM-1); - } - - void WorkerThread::syncComputeWorkerThreads(int numthreads){ - WorkerThread::localBarriers[perilla_wid()].sync(numthreads); - } - - int WorkerThread::perilla_tid(){ - return omp_get_thread_num(); - } - - int WorkerThread::perilla_nTeamThreads(){ - return perilla::NUM_THREADS_PER_TEAM; - } - - int WorkerThread::perilla_nWorkerThreads(){ - return perilla::NUM_THREADS_PER_TEAM-1; - } - int WorkerThread::perilla_nWorkers(){ - return 
perilla::NUM_THREAD_TEAMS; - } - - int WorkerThread::perilla_wtid() - { - int tid= omp_get_thread_num(); - return (tid % perilla::NUM_THREADS_PER_TEAM) -1; - } - - int WorkerThread::perilla_wid() - { - int tid= omp_get_thread_num(); - return tid / perilla::NUM_THREADS_PER_TEAM; - } - - bool WorkerThread::perilla_isMasterWorkerThread() - { - int tid= omp_get_thread_num(); - if((tid % perilla::NUM_THREADS_PER_TEAM)==1) - return true; - else - return false; - } - - bool WorkerThread::perilla_isMasterThread(){ - return perilla_tid()==1; - } - - bool WorkerThread::perilla_isCommunicationThread() - { - int tid= omp_get_thread_num(); - return (tid % perilla::NUM_THREADS_PER_TEAM)==0 ; - } - - bool WorkerThread::isMyRegion(int workerID, int regionID) - { - return ((regionID) % perilla::NUM_THREAD_TEAMS)==workerID; - } - - void WorkerThread::setTeamSharedMemory(void* dummy, int tid, int tg) - { - if((tid % perilla::NUM_THREADS_PER_TEAM)==1) - team_shared_memory[tg] = dummy; - } - - void* WorkerThread::getTeamSharedMemory(int tg) - { - return team_shared_memory[tg]; - } -}//end namepsace diff --git a/Src/AmrTask/rts_impls/mpi_omp/perilla.mak b/Src/AmrTask/rts_impls/mpi_omp/perilla.mak deleted file mode 100755 index 561fa15801f..00000000000 --- a/Src/AmrTask/rts_impls/mpi_omp/perilla.mak +++ /dev/null @@ -1,22 +0,0 @@ -CEXE_sources += Barrier.cpp -CEXE_sources += RGIter.cpp -CEXE_sources += PackageQueue.cpp -CEXE_sources += Perilla.cpp -CEXE_sources += RegionGraph.cpp -CEXE_sources += RegionQueue.cpp -CEXE_sources += WorkerThread.cpp -CEXE_sources += AsyncMultiFabUtil.cpp - - -CEXE_headers += Barrier.H -CEXE_headers += Config.H -CEXE_headers += LocalConnection.H -CEXE_headers += PackageQueue.H -CEXE_headers += RegionGraph.H -CEXE_headers += RegionQueue.H -CEXE_headers += RemoteConnection.H -CEXE_headers += WorkerThread.H -CEXE_headers += AsyncMultiFabUtil.H - - - diff --git a/Src/AmrTask/rts_impls/runtime_common/AsyncMultiFabUtil.H b/Src/AmrTask/rts_impls/runtime_common/AsyncMultiFabUtil.H deleted file mode 100755 index bf23f017626..00000000000 --- a/Src/AmrTask/rts_impls/runtime_common/AsyncMultiFabUtil.H +++ /dev/null @@ -1,34 +0,0 @@ -#ifndef _AsyncMultiFabUtil_H_ -#define _AsyncMultiFabUtil_H_ - -#include -#include -#include -#include - -void average_down_push(Amr& amr, MultiFab& S_fine, MultiFab& S_crse, MultiFab& crse_S_fine, RegionGraph* RG_fine, RegionGraph* RG_crse, const Geometry& fine_geom, const Geometry& crse_geom, int scomp, int ncomp, const IntVect& ratio, int f); - -void average_down_pull(MultiFab& S_fine, MultiFab& S_crse, RegionGraph* RG_fine, RegionGraph* RG_crse, const Geometry& fine_geom, const Geometry& crse_geom, int scomp, int ncomp, const IntVect& ratio, int f); - -void average_down_push(Amr& amr, MultiFab& S_fine, MultiFab& S_crse, MultiFab& crse_S_fine, RegionGraph* RG_fine, RegionGraph* RG_crse, const Geometry& fine_geom, const Geometry& crse_geom, int scomp, int ncomp, const int ratio, int f); - -void average_down_pull(MultiFab& S_fine, MultiFab& S_crse, RegionGraph* RG_fine, RegionGraph* RG_crse, const Geometry& fine_geom, const Geometry& crse_geom, int scomp, int ncomp, const int ratio, int f); - -// Average fine cell-based MultiFab onto crse cell-centered MultiFab without volume weighting. -// This routine DOES NOT assume that the crse BoxArray is a coarsened version of the fine BoxArray. 
- -void average_down_push(Amr& amr, MultiFab& S_fine, MultiFab& S_crse, MultiFab& crse_S_fine, RegionGraph* RG_fine, RegionGraph* RG_crse, int scomp, int ncomp, const IntVect& ratio, int f); - -void average_down_pull(MultiFab& S_fine, MultiFab& S_crse, RegionGraph* RG_fine, RegionGraph* RG_crse, int scomp, int ncomp, const IntVect& ratio, int f); - -void average_down_push(Amr& amr, MultiFab& S_fine, MultiFab& S_crse, MultiFab& crse_S_fine, RegionGraph* RG_fine, RegionGraph* RG_crse, int scomp, int ncomp, int ratio, int f); - -void average_down_pull(MultiFab& S_fine, MultiFab& S_crse, RegionGraph* RG_fine, RegionGraph* RG_crse, int scomp, int ncomp, int ratio, int f); - - -void average_down_push (RGIter& rgi, MultiFab* S_fine, MultiFab* S_crse, MultiFab* crse_S_fine, RegionGraph* RG_fine, RegionGraph* RG_crse, - amrex::Geometry&, amrex::Geometry&,int scomp, int ncomp, const IntVect& ratio, int f); - -void average_down_pull (RGIter& rgi, MultiFab* S_fine, MultiFab* S_crse, RegionGraph* RG_fine, RegionGraph* RG_crse, - amrex::Geometry&, amrex::Geometry&, int scomp, int ncomp, const IntVect& ratio, int f); -#endif diff --git a/Src/AmrTask/rts_impls/runtime_common/AsyncMultiFabUtil.cpp b/Src/AmrTask/rts_impls/runtime_common/AsyncMultiFabUtil.cpp deleted file mode 100755 index 1ced35e1afe..00000000000 --- a/Src/AmrTask/rts_impls/runtime_common/AsyncMultiFabUtil.cpp +++ /dev/null @@ -1,190 +0,0 @@ -#include -//#include -#include -#include -#include -#include - -using namespace amrex; -using namespace perilla; - -void average_down_push (Amr& amr, MultiFab& S_fine, MultiFab& S_crse, MultiFab& crse_S_fine, RegionGraph* RG_fine, RegionGraph* RG_crse, - const Geometry& fgeom, const Geometry& cgeom, int scomp, int ncomp, int rr, int f) -{ - average_down_push(amr,S_fine,S_crse,crse_S_fine,RG_fine,RG_crse,fgeom,cgeom,scomp,ncomp,rr*IntVect::TheUnitVector(),f); -} - -void average_down_pull (MultiFab& S_fine, MultiFab& S_crse, RegionGraph* RG_fine, RegionGraph* RG_crse, - const Geometry& fgeom, const Geometry& cgeom, int scomp, int ncomp, int rr, int f) -{ - average_down_pull(S_fine,S_crse,RG_fine,RG_crse,fgeom,cgeom,scomp,ncomp,rr*IntVect::TheUnitVector(),f); -} - -void average_down_push (Amr& amr, MultiFab& S_fine, MultiFab& S_crse, MultiFab& crse_S_fine, RegionGraph* RG_fine, RegionGraph* RG_crse, - const Geometry& fgeom, const Geometry& cgeom, int scomp, int ncomp, const IntVect& ratio, int f) -{ - if (S_fine.is_nodal() || S_crse.is_nodal()) - { - amrex::Error("Can't use amrex::average_down for nodal MultiFab!"); - } - -#if (BL_SPACEDIM == 3) - average_down_push(amr, S_fine, S_crse, crse_S_fine, RG_fine, RG_crse, scomp, ncomp, ratio, f); - return; -#else - - assert(S_crse.nComp() == S_fine.nComp()); - - - MultiFab fvolume; - fgeom.GetVolume(fvolume, fine_BA, 0); - - int lfi = crse_S_fine.IndexArray()[f]; - const Box& tbx = crse_S_fine[ lfi ].box(); - - amrex_avgdown_with_vol(tbx,crse_S_fine[lfi].array(),S_fine[lfi].array(),fvolume[lfi].array(), - 0,scomp,ncomp,ratio); - - Perilla::multifabCopyPushAsync(RG_crse, RG_fine, &S_crse, &crse_S_fine, f, scomp, 0, ncomp, 0, 0, false); -#endif -} - -void average_down_pull (MultiFab& S_fine, MultiFab& S_crse, RegionGraph* RG_fine, RegionGraph* RG_crse, const Geometry& fgeom, const Geometry& cgeom, - int scomp, int ncomp, const IntVect& ratio, int f) -{ - - if (S_fine.is_nodal() || S_crse.is_nodal()) - { - amrex::Error("Can't use amrex::average_down for nodal MultiFab!"); - } - -#if (BL_SPACEDIM == 3) - average_down_pull(S_fine, S_crse, RG_fine, RG_crse, scomp, 
ncomp, ratio, f); - return; -#else - assert(S_crse.nComp() == S_fine.nComp()); - Perilla::multifabCopyPull(RG_crse, RG_fine, &S_crse, &S_fine, f, scomp, 0, ncomp, 0, 0, false); -#endif -} - -// ************************************************************************************************************* - -void average_down_push (Amr& amr, MultiFab& S_fine, MultiFab& S_crse, MultiFab& crse_S_fine, RegionGraph* RG_fine, RegionGraph* RG_crse, - int scomp, int ncomp, int rr, int f) -{ - average_down_push(amr,S_fine,S_crse,crse_S_fine,RG_fine,RG_crse,scomp,ncomp,rr*IntVect::TheUnitVector(),f); -} - -void average_down_pull (MultiFab& S_fine, MultiFab& S_crse, RegionGraph* RG_fine, RegionGraph* RG_crse, int scomp, int ncomp, int rr, int f) -{ - average_down_pull(S_fine,S_crse,RG_fine,RG_crse,scomp,ncomp,rr*IntVect::TheUnitVector(),f); -} - -void average_down_push (Amr& amr, MultiFab& S_fine, MultiFab& S_crse, MultiFab& crse_S_fine, RegionGraph* RG_fine, RegionGraph* RG_crse, - int scomp, int ncomp, const IntVect& ratio, int f) -{ - assert(S_crse.nComp() == S_fine.nComp()); - - // NOTE: The tilebox is defined at the coarse level. - int lfi = crse_S_fine.IndexArray()[f]; - int tg = WorkerThread::perilla_wid(); - int nt = WorkerThread::perilla_wtid(); - - for(int t=0; tfabTiles[f]->numTiles; t++) - if(t % (perilla::NUM_THREADS_PER_TEAM-1) == nt) - { - const Box& tbx = *(RG_fine->fabTiles[f]->tileBx[t]); - amrex_avgdown(tbx,crse_S_fine[lfi].array(),S_fine[lfi].array(),0,scomp,ncomp,ratio); - } - RG_fine->worker[tg]->l_barr->sync(perilla::NUM_THREADS_PER_TEAM-1); // Barrier to synchronize team threads - Perilla::multifabCopyPushAsync(RG_crse, RG_fine, &S_crse, &crse_S_fine, f, scomp, 0, ncomp, 0, 0, false); -} - -void average_down_pull (MultiFab& S_fine, MultiFab& S_crse, RegionGraph* RG_fine, RegionGraph* RG_crse, - int scomp, int ncomp, const IntVect& ratio, int f) -{ - assert(S_crse.nComp() == S_fine.nComp()); - Perilla::multifabCopyPull(RG_crse, RG_fine, &S_crse, &S_fine, f, scomp, 0, ncomp, 0, 0, false); -} - - -void average_down_push (RGIter& rgi, MultiFab* S_fine, MultiFab* S_crse, MultiFab* crse_S_fine, RegionGraph* RG_fine, RegionGraph* RG_crse,amrex::Geometry& geom, amrex::Geometry& geom1, - int scomp, int ncomp, const IntVect& ratio, int f) -{ - if(rgi.currentItr != rgi.totalItr) - return; - int tg = WorkerThread::perilla_wid(); - - f = rgi.currentRegion; - // NOTE: The tilebox is defined at the coarse level. - int lfi = crse_S_fine->IndexArray()[f]; - - // NOTE: We copy from component scomp of the fine fab into component 0 of the crse fab - // because the crse fab is a temporary which was made starting at comp 0, it is - // not part of the actual crse multifab which came in. 
- - //perilla::syncWorkerThreads(); - RG_fine->worker[tg]->l_barr->sync(perilla::NUM_THREADS_PER_TEAM-1); // Barrier to synchronize team threads - int nThreads= perilla::nWorkerThreads(); - for(int t=0; tfabTiles[f]->numTiles; t+= nThreads) - { - const Box& tbx = *(RG_fine->fabTiles[f]->tileBx[t]); - amrex_avgdown(tbx,(*crse_S_fine)[lfi].array(),(*S_fine)[lfi].array(),0,scomp,ncomp,ratio); - } - //perilla::syncWorkerThreads(); - RG_fine->worker[tg]->l_barr->sync(perilla::NUM_THREADS_PER_TEAM-1); // Barrier to synchronize team threads - Perilla::multifabCopyPush(RG_crse, RG_fine, S_crse, crse_S_fine, f, scomp, 0, ncomp, 0, 0, false); -} - -void average_down_pull (RGIter& rgi, MultiFab* S_fine, MultiFab* S_crse, RegionGraph* RG_fine, RegionGraph* RG_crse, amrex::Geometry& geom, amrex::Geometry& geom1, - int scomp, int ncomp, const IntVect& ratio, int f) -{ - if(rgi.currentItr != 1) - return; - f = rgi.currentRegion; - - Perilla::multifabCopyPull(RG_crse, RG_fine, S_crse, S_fine, f, scomp, 0, ncomp, 0, 0, false); -} - - -#if 0 -#include "PerillaMemCheck.H" - -void PerillaMemCheck::add(string key, void* obj, string classname) -{ - lock.lock(); - if(objMap.find(key) == objMap.end()) - { - objMap[key]= obj; - printf("Adding an object\n"); - } - else{ - printf("Reinsert an object\n"); - exit(0); - } - lock.unlock(); -} - - -void PerillaMemCheck::remove(string key){ - lock.lock(); - if(objMap.find(key) != objMap.end()) - { - objMap.erase(key); - printf("Removing an object\n"); - } - else{ - printf("Object not found\n"); - exit(0); - } - - lock.unlock(); -} -void PerillaMemCheck::report(){ - if(objMap.size()) { - printf("Memory leak found\n"); - }else printf("all packages deallocated\n"); -} - - -#endif diff --git a/Src/AmrTask/rts_impls/runtime_common/Barrier.H b/Src/AmrTask/rts_impls/runtime_common/Barrier.H deleted file mode 100755 index 1ceb5caa579..00000000000 --- a/Src/AmrTask/rts_impls/runtime_common/Barrier.H +++ /dev/null @@ -1,20 +0,0 @@ -#ifndef P_BARRIER_H -#define P_BARRIER_H -#include - -class Barrier -{ -private: - volatile int counter; - int maxThreads; - pthread_cond_t condition; - pthread_mutex_t condition_mutex; - volatile bool globalSense; -public: - Barrier(); - Barrier(int maxThreads); - void init(int maxThreads); - void sync(); - void sync(int numthreads); -}; -#endif diff --git a/Src/AmrTask/rts_impls/runtime_common/Barrier.cpp b/Src/AmrTask/rts_impls/runtime_common/Barrier.cpp deleted file mode 100755 index 9f905943acf..00000000000 --- a/Src/AmrTask/rts_impls/runtime_common/Barrier.cpp +++ /dev/null @@ -1,79 +0,0 @@ -#include "Barrier.H" -#include -#include -#include - -Barrier::Barrier() -{ - //With this intializer, numthreads has to be specified when syncing, i.e. 
sync(numthreads) - counter = INT_MAX; - maxThreads=INT_MAX; - condition= PTHREAD_COND_INITIALIZER; - condition_mutex= PTHREAD_MUTEX_INITIALIZER; - globalSense = false; -} - -Barrier::Barrier(int numthreads) -{ -//With this initializer, both sync() and sync(numthreads) can be used - counter = numthreads; - maxThreads= numthreads; - condition= PTHREAD_COND_INITIALIZER; - condition_mutex= PTHREAD_MUTEX_INITIALIZER; - globalSense = false; -} - -void Barrier::init(int numthreads) -{ -//Similar to Barrier(int numthreads) - counter = numthreads; - maxThreads= numthreads; - condition= PTHREAD_COND_INITIALIZER; - condition_mutex= PTHREAD_MUTEX_INITIALIZER; - globalSense = false; -} - -void Barrier::sync() //sync all threads associated with this barrier -{ - assert(maxThreads -#include -#include -#include - -using namespace perilla; -#ifdef PERILLA_DEBUG -#include "PerillaMemCheck.H" -extern PerillaMemCheck memcheck; -#endif - -using namespace perilla; -using namespace amrex; - -class LocalCopyDescriptor -{ - public: - int ns; //Source box in layout - int nd; //Destination box in layout - int sz; - Box sbx; //Sub-box for this copy - Box dbx; //Sub-box for this copy - PackageQueue pQueue; //store incoming or outgoing messages, both fab and the runtime can access this queue - PackageQueue recycleQueue; //just for now, I'll replace this with a NUMA aware package allocator - int sPartner, dPartner; - int dcpyCnt,scpyCnt; - pthread_mutex_t ghostLock; - LocalCopyDescriptor() : ns(-1), nd(-1), scpyCnt(0), dcpyCnt(0), sz(0), sPartner(-1), dPartner(-1), ghostLock(PTHREAD_MUTEX_INITIALIZER) - { -#ifdef PERILLA_DEBUG -// memcheck.add(memcheck.genKey(this), (void*)this, "LocalCopyDescriptor"); -#endif - } - ~LocalCopyDescriptor(){ -#ifdef PERILLA_DEBUG -// memcheck.remove(memcheck.genKey(this)); -#endif - } -}; - -class LocalConnection -{ - public: - int nscpy; //Number of cpy chunks - int ndcpy; //Number of cpy chunks - pthread_mutex_t sLock, dLock, ghostLock; - int firingRuleCnt; - int scpyCnt, dcpyCnt; - Barrier *localBarrier; - LocalCopyDescriptor *scpy; - LocalCopyDescriptor *dcpy; - LocalConnection() : nscpy(0), ndcpy(0), firingRuleCnt(0), scpy(NULL), dcpy(NULL), scpyCnt(0), dcpyCnt(0), localBarrier(NULL),sLock(PTHREAD_MUTEX_INITIALIZER),dLock(PTHREAD_MUTEX_INITIALIZER),ghostLock(PTHREAD_MUTEX_INITIALIZER){ -// memcheck.add(memcheck.genKey(this), (void*)this, "LocalCopyDescriptor"); -} - - ~LocalConnection() - { - if(localBarrier) free(localBarrier); - if(scpy) delete [] scpy; - if(dcpy) delete [] dcpy; -// memcheck.remove(memcheck.genKey(this)); - } -}; -#endif diff --git a/Src/AmrTask/rts_impls/runtime_common/Make.package b/Src/AmrTask/rts_impls/runtime_common/Make.package deleted file mode 100644 index 137eb3063d5..00000000000 --- a/Src/AmrTask/rts_impls/runtime_common/Make.package +++ /dev/null @@ -1,8 +0,0 @@ -PERILLA_LIB=EXE - -C$(PERILLA_LIB)_sources += Barrier.cpp RGIter.cpp RegionQueue.cpp RegionGraph.cpp WorkerThread.cpp AsyncMultiFabUtil.cpp AsyncMultiFabUtil.cpp PerillaMemCheck.cpp Perilla_common.cpp - -C$(PERILLA_LIB)_headers += Barrier.H LocalConnection.H RGIter.H RegionQueue.H RemoteConnection.H WorkerThread.H RegionGraph.H AsyncMultiFabUtil.H PerillaMemCheck.H Perilla.H - -VPATH_LOCATIONS += $(AMREX_HOME)/Src/AmrTask/rts_impls/runtime_common -INCLUDE_LOCATIONS += $(AMREX_HOME)/Src/AmrTask/rts_impls/runtime_common diff --git a/Src/AmrTask/rts_impls/runtime_common/PerillaMemCheck.H b/Src/AmrTask/rts_impls/runtime_common/PerillaMemCheck.H deleted file mode 100644 index 
f624aaceb7c..00000000000 --- a/Src/AmrTask/rts_impls/runtime_common/PerillaMemCheck.H +++ /dev/null @@ -1,30 +0,0 @@ -#ifndef P_MEMCHECK_H -#define P_MEMCHECK_H -#include -#include -#include -#include "mylock.h" -using namespace std; - -namespace perilla{ - - class PerillaMemCheck - { - public: - void add(string key, void* obj, string classname); - void remove(string key); - string genKey(void *obj){ - std::stringstream ost; - ost< objMap; - int addCnt, rmCnt; - }; -}//end namespace - -#endif diff --git a/Src/AmrTask/rts_impls/runtime_common/PerillaMemCheck.cpp b/Src/AmrTask/rts_impls/runtime_common/PerillaMemCheck.cpp deleted file mode 100644 index e77886eaa02..00000000000 --- a/Src/AmrTask/rts_impls/runtime_common/PerillaMemCheck.cpp +++ /dev/null @@ -1,40 +0,0 @@ -#include "PerillaMemCheck.H" -using namespace perilla; - -void PerillaMemCheck::add(string key, void* obj, string classname) -{ - lock.lock(); - if(objMap.find(key) == objMap.end()) - { - objMap[key]= obj; - addCnt++; - } - else{ - printf("MemCheck Error: Reinsert an object\n"); - exit(0); - } - lock.unlock(); -} - - -void PerillaMemCheck::remove(string key){ - lock.lock(); - if(objMap.find(key) != objMap.end()) - { - objMap.erase(key); - rmCnt++; - } - else{ - printf("MemCheck Error: Object not found (%d Allocated vs %d Deleted)\n", addCnt, rmCnt); - exit(0); - } - - lock.unlock(); -} -void PerillaMemCheck::report(){ - if(objMap.size()) { - printf("Memory leak found: %d objects (%d Allocated vs %d Deleted)\n", objMap.size(), addCnt, rmCnt); - }else printf("All allocated objects have been deallocated (%d Allocated vs %d Deleted)\n", addCnt, rmCnt); -} - - diff --git a/Src/AmrTask/rts_impls/runtime_common/Perilla_common.cpp b/Src/AmrTask/rts_impls/runtime_common/Perilla_common.cpp deleted file mode 100755 index bf2de14eec3..00000000000 --- a/Src/AmrTask/rts_impls/runtime_common/Perilla_common.cpp +++ /dev/null @@ -1,3429 +0,0 @@ -#include -#include -#include -#include -#include -#include -#include -#include -#include -#include -#include -#include -#include -using namespace std; -using namespace amrex; -using namespace perilla; - - -volatile int Perilla::numTeamsFinished = 0; -volatile int Perilla::updateMetadata_request = 0; -volatile int Perilla::updateMetadata_noticed = 0; -volatile int Perilla::updateMetadata_done = 0; -int Perilla::max_step=1; -std::map> Perilla::pTagCnt; -int Perilla::uTags=0; -bool Perilla::genTags=true; -std::map > > > > Perilla::tagMap; -std::map > > > Perilla::myTagMap; - -pthread_mutex_t table_lock= PTHREAD_MUTEX_INITIALIZER; -std::map tidTable; -void Perilla::registerId(int tid){ - pthread_mutex_lock(&table_lock); - tidTable[pthread_self()]= tid; - pthread_mutex_unlock(&table_lock); -} - -int Perilla::tid(){//this function can be called after all threads already register their ids - #ifdef USE_PERILLA_ON_DEMAND - return omp_get_thread_num(); - #else - return tidTable[pthread_self()]; - #endif -} - -void Perilla::clearTagMap(){ - Perilla::tagMap.clear(); -} - -void Perilla::clearMyTagMap(){ - Perilla::myTagMap.clear(); -} - - -void Perilla::flattenGraphHierarchy(std::vector > graphArrayHierarchy, std::vector &graphArray){ - graphArray.clear(); - int gCnt=0; - for(int l=0; l tags_t; - typedef std::map> stags_t; - typedef std::map>> dstags_t; - typedef std::map>>> gdstags_t; - typedef std::map>>>> pgdstags_t; - - int** tags = new int*[nPs]; - int** rtags = new int*[nPs]; - int* rTagCnt = new int[nPs*2]; - int* sTagCnt = new int[nPs*2]; - - MPI_Request *srrequest; - srrequest = new MPI_Request[nPs]; - 
MPI_Request *ssrequest; - ssrequest = new MPI_Request[nPs]; - MPI_Request *trrequest; - trrequest = new MPI_Request[nPs]; - MPI_Request *tsrequest; - tsrequest = new MPI_Request[nPs]; - - std::vector proc_communicated; - - proc_communicated.resize(nPs); - for(int p=0; psecond.begin(); it2 != it1->second.end(); it2++) - { - tac++; - tac++; - ng++; - for(dstags_t::iterator it3 = it2->second.begin(); it3 != it2->second.end(); it3++) - for(stags_t::iterator it4 = it3->second.begin(); it4 != it3->second.end(); it4++) - for(tags_t::iterator it5 = it4->second.begin(); it5 != it4->second.end(); it5++) - { - tac+=4; - } - } - sTagCnt[it1->first*2] = tac; - sTagCnt[it1->first*2+1] = ng; - tags[it1->first] = new int[sTagCnt[it1->first*2]]; - MPI_Isend(&sTagCnt[it1->first*2], 2, MPI_INT, it1->first, 1000, MPI_COMM_WORLD, &ssrequest[it1->first]); - proc_communicated[it1->first]=true; - } - - for(int p=0; psecond.begin(); it2 != it1->second.end(); it2++) - { - tags[it1->first][tac++] = it2->first; - tags[it1->first][tac++] = pTagCnt[it1->first][it2->first]; - int gtagc = 0; - for(dstags_t::iterator it3 = it2->second.begin(); it3 != it2->second.end(); it3++) - for(stags_t::iterator it4 = it3->second.begin(); it4 != it3->second.end(); it4++) - for(tags_t::iterator it5 = it4->second.begin(); it5 != it4->second.end(); it5++) - { - tags[it1->first][tac++] = it3->first; - tags[it1->first][tac++] = it4->first; - tags[it1->first][tac++] = it5->first; - tags[it1->first][tac++] = it5->second; - gtagc++; - } - BL_ASSERT(pTagCnt[it1->first][it2->first] == gtagc); - } - MPI_Isend(tags[it1->first], tac, MPI_INT, it1->first, 1001, MPI_COMM_WORLD, &tsrequest[it1->first]); - } - - MPI_Status status; - for(int p=0; p 0) - { - rtags[p] = new int[rTagCnt[p*2]]; - MPI_Irecv(rtags[p], rTagCnt[p*2], MPI_INT, p , 1001, MPI_COMM_WORLD, &trrequest[p]); - } - } - } - - - // //MPI_Irecv(size) Wait - - - //MPI_recive tags arra - for(int p=0; p 0) - { - MPI_Wait( &trrequest[p], &status ); - int tCnt=0; - for(int g=0; g 0) - { - delete[] rtags[p]; - } - } - - - for(int p=0; psize(); - const int n_snds_mf = TheFB.m_SndTags->size(); - const int n_rcvs_mf = TheFB.m_RcvTags->size(); - - Vector send_cctc; - Vector send_pr; - send_cctc.reserve(n_snds_mf); - - for (FabArrayBase::MapOfCopyComTagContainers::const_iterator m_it = TheFB.m_SndTags->begin(), - m_End = TheFB.m_SndTags->end(); - m_it != m_End; - ++m_it) - { - if(m_it->first != myProc) // Not destined to me. 
- { - send_pr.push_back(m_it->first); - send_cctc.push_back(&(m_it->second)); - } - } - - Vector recv_cctc; - Vector recv_pr; - recv_cctc.reserve(n_rcvs_mf); - - for (FabArrayBase::MapOfCopyComTagContainers::const_iterator m_it = TheFB.m_RcvTags->begin(), - m_End = TheFB.m_RcvTags->end(); - m_it != m_End; - ++m_it) - { - if(m_it->first != myProc) // I am not the source for this receipt - { - recv_pr.push_back(m_it->first); - recv_cctc.push_back(&(m_it->second)); - } - } - -//#pragma omp parallel shared(rg, mf, numfabs, np, TheFB, recv_cctc, send_cctc) - { - //int tg = omp_get_thread_num(); - int fg; -// if(WorkerThread::perilla_isCommunicationThread()) -//#pragma omp single - { - //bool cc = !mf->is_nodal(); // cc = multifab_cell_centered_q(mf) - //mf->sMap.reserve(numfabs); - //mf->rMap.reserve(numfabs); - //std::cout<< "Allocating sMap and rMap" <alloc_lMap(mf); - rg->alloc_sMap(mf); - rg->alloc_rMap(mf); - } -//#pragma omp barrier - //if(tid==0) - { - //bool cc = !mf->is_nodal(); // cc = multifab_cell_centered_q(mf) - //mf->sMap.reserve(numfabs); - //mf->rMap.reserve(numfabs); -//#pragma omp for - for(int f=0; flMap[f]->l_con.nscpy = 0; - - //for(int i=0; il_con.ncpy; i++) - for(int i=0; il_con.cpy[i].ns)) //LocalIndex - if(mf.IndexArray()[f] == tag.srcIndex) - rg->lMap[f]->l_con.nscpy++; - //if(f == local_index(mf,bxasc->l_con.cpy[i].nd)) //LocalIndex - if(mf.IndexArray()[f] == tag.dstIndex) - rg->lMap[f]->l_con.ndcpy++; - } - /* - if(rg->lMap[f]->l_con.nscpy+rg->lMap[f]->l_con.ndcpy != n_loc_mf) - std::cout<< "Diff in Sum " << rg->lMap[f]->l_con.nscpy << " " <lMap[f]->l_con.ndcpy << " " << n_loc_mf <lMap[f]->l_con.nscpy+rg->lMap[f]->l_con.ndcpy == n_loc_mf); - */ - } - } - } -//#pragma omp barrier - //now we know how many copying segments each fab owns as source and destination allocate memory for metadata -//#pragma omp for - for(int f=0; flMap[f]->l_con.sLock)); - //omp_init_lock(&(rg->lMap[f]->l_con.dLock)); - //omp_init_lock(&(rg->lMap[f]->l_con.ghostLock)); - - //std::cout<< "MF l_con nscpy " <lMap[f]->l_con.nscpy << " ndcpy " << rg->lMap[f]->l_con.ndcpy <lMap[f]->l_con.scpy = new LocalCopyDescriptor[rg->lMap[f]->l_con.nscpy]; - rg->lMap[f]->l_con.dcpy = new LocalCopyDescriptor[rg->lMap[f]->l_con.ndcpy]; - rg->lMap[f]->l_con.scpyCnt = 0; - rg->lMap[f]->l_con.dcpyCnt = 0; - } - } -//#pragma omp barrier - if(np > 1) - { -//#pragma omp for - for(int f=0; flMap[f]->r_con.nrcv = 0; - rg->lMap[f]->r_con.nsnd = 0; - rg->lMap[f]->r_con.firingRuleCnt = 0; - - //for(int i=0; ir_con.nsnd; i++) - for(int i=0; ir_con.snd[i].ns)) //LocalIndex - if(mf.IndexArray()[f] == it->srcIndex) - { - rg->lMap[f]->r_con.nsnd++; - } - } - } - //for(int i=0; ir_con.nrcv; i++) - for(int i=0; ir_con.rcv[i].nd)) //LocalIndex - if(mf.IndexArray()[f] == it->dstIndex) - { - rg->lMap[f]->r_con.nrcv++; - } - } - } - //rg->sMap[f]->r_con.sndLock = new omp_lock_t; - //rg->rMap[f]->r_con.rcvLock = new omp_lock_t; - //omp_init_lock(rg->sMap[f]->r_con.sndLock); - //omp_init_lock(rg->rMap[f]->r_con.rcvLock); - rg->lMap[f]->r_con.snd = new RemoteCommDescriptor[rg->lMap[f]->r_con.nsnd]; - rg->lMap[f]->r_con.rcv = new RemoteCommDescriptor[rg->lMap[f]->r_con.nrcv]; - } - } - // if(WorkerThread::perilla_isMasterWorkerThread() && tg==0) - { -//#pragma omp for - for(int f=0; frMap[f]->r_con.nrcv = 0; - rg->sMap[f]->r_con.nsnd = 0; - - //for(int i=0; ir_con.nsnd; i++) - for(int i=0; ir_con.snd[i].ns)) //LocalIndex - if(mf.IndexArray()[f] == it->srcIndex) - { - rg->sMap[f]->r_con.nsnd++; - } - } - } - //for(int i=0; ir_con.nrcv; 
i++) - for(int i=0; ir_con.rcv[i].nd)) //LocalIndex - if(mf.IndexArray()[f] == it->dstIndex) - { - rg->rMap[f]->r_con.nrcv++; - } - } - } - //rg->sMap[f]->r_con.sndLock = new omp_lock_t; - //rg->rMap[f]->r_con.rcvLock = new omp_lock_t; - //omp_init_lock(rg->sMap[f]->r_con.sndLock); - //omp_init_lock(rg->rMap[f]->r_con.rcvLock); - rg->sMap[f]->r_con.snd = new RemoteCommDescriptor[rg->sMap[f]->r_con.nsnd]; - rg->rMap[f]->r_con.rcv = new RemoteCommDescriptor[rg->rMap[f]->r_con.nrcv]; - } - } - } - } // omp parallel - //std::cout<< "counting done " <lMap[f]->l_con.localBarrier = new Barrier(perilla::NUM_THREADS_PER_TEAM-1); - // !create local communication meta data for sources and destinations - scnt = -1; - dcnt = -1; - //for(int i=0; il_con.ncpy; i++) - for(int i=0; il_con.cpy[i].ns)) //LocalIndex - if(mf.IndexArray()[f] == tag.srcIndex) - { - scnt++; - //omp_init_lock(&(rg->lMap[f]->l_con.scpy[scnt].ghostLock)); - rg->lMap[f]->l_con.scpy[scnt].ns = mf.localindex(tag.srcIndex); //local_index(mf,bxasc->l_con.cpy[i].ns); //LocalIndex - rg->lMap[f]->l_con.scpy[scnt].nd = mf.localindex(tag.dstIndex); //local_index(mf,bxasc->l_con.cpy[i].nd); //LocalIndex - rg->lMap[f]->l_con.scpy[scnt].sbx = tag.sbox; //bxasc->l_con.cpy[i].sbx; - rg->lMap[f]->l_con.scpy[scnt].dbx = tag.dbox; //bxasc->l_con.cpy[i].dbx; - // !create queues for ghost cells - //call queue_init(mf%fbs(f)%l_con%scpy(scnt)%pQueue) - //call queue_init(mf%fbs(f)%l_con%scpy(scnt)%recycleQueue) - - int psize = tag.sbox.numPts() * mf.nComp(); //---------------------------------------------------------------???????????????? - /* - p => dataptr(mf%fbs(f), mf%fbs(f)%l_con%scpy(scnt)%sbx, 1, mf%nc) - s1= size(p,1) - s2= size(p,2) - s3= size(p,3) - s4= size(p,4) - s1*s2*s3*s4 - */ - for(int p=0; pdatabuf.local();//(static_cast >(tmpPkg->databuf)).local(); - for(int j=0; jdatabuf)[j] = 0; -#endif - rg->lMap[f]->l_con.scpy[scnt].pQueue.enqueue(tmpPkg); - } - for(int p=0; plMap[f]->l_con.scpy[scnt].recycleQueue.enqueue(rg->lMap[f]->l_con.scpy[scnt].pQueue.dequeue()); - } - //if(f == local_index(mf,bxasc->l_con.cpy[i].nd)) //LocalIndex - if(mf.IndexArray()[f] == tag.dstIndex) - { - dcnt++; - rg->lMap[f]->l_con.dcpy[dcnt].ns = mf.localindex(tag.srcIndex); //local_index(mf,bxasc->l_con.cpy[i].ns); //LocalIndex - rg->lMap[f]->l_con.dcpy[dcnt].nd = mf.localindex(tag.dstIndex); //local_index(mf,bxasc->l_con.cpy[i].nd); //LocalIndex - rg->lMap[f]->l_con.dcpy[dcnt].sbx = tag.sbox; //bxasc->l_con.cpy[i].sbx; - rg->lMap[f]->l_con.dcpy[dcnt].dbx = tag.dbox; //bxasc->l_con.cpy[i].dbx; - //call queue_init(mf%fbs(f)%l_con%dcpy(dcnt)%pQueue) - //call queue_init(mf%fbs(f)%l_con%dcpy(dcnt)%recycleQueue) - int psize = tag.dbox.numPts() * mf.nComp(); //---------------------------------------------------------------???????????????? 
- /* - p => dataptr(mf%fbs(f), mf%fbs(f)%l_con%dcpy(dcnt)%dbx, 1, mf%nc) - s1= size(p,1) - s2= size(p,2) - s3= size(p,3) - s4= size(p,4) - s1*s2*s3*s4 - */ - - for(int p=0; pdatabuf.local();//(static_cast >(tmpPkg->databuf)).local(); - for(int j=0; jdatabuf)[j] = 0; -#endif - rg->lMap[f]->l_con.dcpy[dcnt].pQueue.enqueue(tmpPkg); - } - for(int p=0; plMap[f]->l_con.dcpy[dcnt].recycleQueue.enqueue(rg->lMap[f]->l_con.dcpy[dcnt].pQueue.dequeue()); - } - } // for(ilMap[f]->l_con.nscpy; i++) - for(int j=0; jlMap[rg->lMap[f]->l_con.scpy[i].nd]->l_con.ndcpy; j++) - if(rg->lMap[f]->l_con.scpy[i].dbx == rg->lMap[rg->lMap[f]->l_con.scpy[i].nd]->l_con.dcpy[j].dbx) - rg->lMap[f]->l_con.scpy[i].dPartner = j; - - for(int i=0; ilMap[f]->l_con.ndcpy; i++) - for(int j=0; jlMap[rg->lMap[f]->l_con.dcpy[i].ns]->l_con.nscpy; j++) - if(rg->lMap[f]->l_con.dcpy[i].dbx == rg->lMap[rg->lMap[f]->l_con.dcpy[i].ns]->l_con.scpy[j].dbx) - rg->lMap[f]->l_con.dcpy[i].sPartner = j; - } - } - if(np == 1) return; - - //std::cout<< "local init done" <lMap[f]->r_con.sndLock = new omp_lock_t; - //rg->lMap[f]->r_con.rcvLock = new omp_lock_t; - //omp_init_lock(rg->lMap[f]->r_con.sndLock); - //omp_init_lock(rg->lMap[f]->r_con.rcvLock); - //rg->lMap[f]->r_con.snd = new RemoteCommDescriptor[rg->lMap[f]->r_con.nsnd]; - //rg->lMap[f]->r_con.rcv = new RemoteCommDescriptor[rg->lMap[f]->r_con.nrcv]; - nrcv= -1; - //for(int i=0; ir_con.nrcv; i++) - for(int i=0; ir_con.rcv[i].nd)) //LocalIndex - if(mf.IndexArray()[f] == it->dstIndex) - { - nrcv++; - rg->lMap[f]->r_con.rcv[nrcv].ns = it->srcIndex; //bxasc->r_con.rcv[i].ns; - //rg->lMap[f]->r_con.rcv[nrcv].lnd = ; //local_index(mf,bxasc->r_con.rcv[i].nd); // not used anywhere so deferred ---------???????? - //rg->lMap[f]->r_con.rcv[nrcv].lns = -1; //undefined - rg->lMap[f]->r_con.rcv[nrcv].nd = it->dstIndex; //bxasc->r_con.rcv[i].nd; - rg->lMap[f]->r_con.rcv[nrcv].lnd = mf.localindex(it->dstIndex); - rg->lMap[f]->r_con.rcv[nrcv].lns = mf.localindex(it->srcIndex); - rg->lMap[f]->r_con.rcv[nrcv].sbx = it->sbox; //bxasc->r_con.rcv[i].sbx; - rg->lMap[f]->r_con.rcv[nrcv].dbx = it->dbox; //bxasc->r_con.rcv[i].dbx; - rg->lMap[f]->r_con.rcv[nrcv].pr = pr; //bxasc->r_con.rcv[i].pr; - rg->lMap[f]->r_con.rcv[nrcv].cnt = 0; - //!create queues for ghost cells - //call queue_init(mf%fbs(f)%r_con%rcv(nrcv)%pQueue) - //call queue_init(mf%fbs(f)%r_con%rcv(nrcv)%recycleQueue) - int psize = it->sbox.numPts() * mf.nComp(); //---------------------------------------------------------------???????????????? - /* - p => dataptr(mf%fbs(f), mf%fbs(f)%r_con%rcv(nrcv)%dbx, 1, mf%nc) - s1= size(p,1) - s2= size(p,2) - s3= size(p,3) - s4= size(p,4) - s1*s2*s3*s4 - */ - rg->lMap[f]->r_con.rcv[nrcv].sz = psize; - for(int p=0; pdatabuf.local();//(static_cast >(tmpPkg->databuf)).local(); - for(int j=0; jdatabuf)[j] = 0; -#endif - rg->lMap[f]->r_con.rcv[nrcv].pQueue.enqueue(tmpPkg); - } - for(int p=0; plMap[f]->r_con.rcv[nrcv].recycleQueue.enqueue(rg->lMap[f]->r_con.rcv[nrcv].pQueue.dequeue()); - } - } - } // for(ir_con.nsnd; i++) - for(int i=0; ir_con.snd[i].ns)) //LocalIndex - if(mf.IndexArray()[f] == it->srcIndex ) - { - nsnd++; - rg->lMap[f]->r_con.snd[nsnd].ns = it->srcIndex; //bxasc->r_con.snd[i].ns; - rg->lMap[f]->r_con.snd[nsnd].nd = it->dstIndex; //bxasc->r_con.snd[i].nd; - //rg->lMap[f]->r_con.snd[nsnd].lns = ; //local_index(mf,bxasc->r_con.snd[i].ns); //not used anywhere so deferred ------????????? 
- //rg->lMap[f]->r_con.snd[nsnd].lnd = -1; //undefined - rg->lMap[f]->r_con.snd[nsnd].lns = mf.localindex(it->srcIndex); - rg->lMap[f]->r_con.snd[nsnd].lnd = mf.localindex(it->dstIndex); - rg->lMap[f]->r_con.snd[nsnd].sbx = it->sbox; //bxasc->r_con.snd[i].sbx; - rg->lMap[f]->r_con.snd[nsnd].dbx = it->dbox; //bxasc->r_con.snd[i].dbx; - rg->lMap[f]->r_con.snd[nsnd].pr = pr; //bxasc->r_con.snd[i].pr; - rg->lMap[f]->r_con.snd[nsnd].cnt = 0; - //!create queues for ghost cells - //call queue_init(mf%fbs(f)%r_con%snd(nsnd)%pQueue) - //call queue_init(mf%fbs(f)%r_con%snd(nsnd)%recycleQueue) - int psize = it->sbox.numPts() * mf.nComp(); //---------------------------------------------------------------???????????????? - /* - p => dataptr(mf%fbs(f), mf%fbs(f)%r_con%snd(nsnd)%sbx, 1, mf%nc) - s1= size(p,1) - s2= size(p,2) - s3= size(p,3) - s4= size(p,4) - s1*s2*s3*s4 - */ - rg->lMap[f]->r_con.snd[nsnd].sz = psize; - for(int p=0; pdatabuf.local();//(static_cast >(tmpPkg->databuf)).local(); - for(int j=0; jdatabuf)[j] = 0; -#endif - rg->lMap[f]->r_con.snd[nsnd].pQueue.enqueue(tmpPkg); - } - for(int p=0; plMap[f]->r_con.snd[nsnd].recycleQueue.enqueue(rg->lMap[f]->r_con.snd[nsnd].pQueue.dequeue()); - - //std::cout<< "RQ f "<< f << " i "<< nsnd <lMap[f]->r_con.nsnd; i++) - { - rg->sMap[f]->r_con.snd[i].ns = rg->lMap[f]->r_con.snd[i].ns; - rg->sMap[f]->r_con.snd[i].nd = rg->lMap[f]->r_con.snd[i].nd; - rg->sMap[f]->r_con.snd[i].lns = rg->lMap[f]->r_con.snd[i].lns; - rg->sMap[f]->r_con.snd[i].lnd = rg->lMap[f]->r_con.snd[i].lnd; - rg->sMap[f]->r_con.snd[i].r_gid = rg->graphID-1; - rg->sMap[f]->r_con.snd[i].r_grids = rg->numFabs; - rg->sMap[f]->r_con.snd[i].sbx = rg->lMap[f]->r_con.snd[i].sbx; - rg->sMap[f]->r_con.snd[i].dbx = rg->lMap[f]->r_con.snd[i].dbx; - rg->sMap[f]->r_con.snd[i].pr = rg->lMap[f]->r_con.snd[i].pr; - rg->sMap[f]->r_con.snd[i].sz = rg->lMap[f]->r_con.snd[i].sz; - rg->sMap[f]->r_con.snd[i].cnt = 0; - rg->lMap[f]->r_con.snd[i].cnt = 0; - - for(int p=0; plMap[f]->r_con.snd[i].sz); -#ifdef PERILLA_USE_UPCXX - void* local_ptr= tmpPkg->databuf.local();//(static_cast >(tmpPkg->databuf)).local(); - for(int j=0; jlMap[f]->r_con.snd[i].sz; j++) - ((double*)local_ptr)[j]= 0; -#else - for(int j=0; jlMap[f]->r_con.snd[i].sz; j++) - ((double*)tmpPkg->databuf)[j] = 0; -#endif - rg->sMap[f]->r_con.snd[i].pQueue.enqueue(tmpPkg); - } - for(int p=0; psMap[f]->r_con.snd[i].recycleQueue.enqueue(rg->sMap[f]->r_con.snd[i].pQueue.dequeue()); - } - for(int i=0; ilMap[f]->r_con.nrcv; i++) - { - rg->rMap[f]->r_con.rcv[i].ns = rg->lMap[f]->r_con.rcv[i].ns; - rg->rMap[f]->r_con.rcv[i].nd = rg->lMap[f]->r_con.rcv[i].nd; - rg->rMap[f]->r_con.rcv[i].lns = rg->lMap[f]->r_con.rcv[i].lns; - rg->rMap[f]->r_con.rcv[i].lnd = rg->lMap[f]->r_con.rcv[i].lnd; - rg->rMap[f]->r_con.rcv[i].r_gid = rg->graphID-1; - rg->rMap[f]->r_con.rcv[i].r_grids = rg->numFabs; - rg->rMap[f]->r_con.rcv[i].sbx = rg->lMap[f]->r_con.rcv[i].sbx; - rg->rMap[f]->r_con.rcv[i].dbx = rg->lMap[f]->r_con.rcv[i].dbx; - rg->rMap[f]->r_con.rcv[i].pr = rg->lMap[f]->r_con.rcv[i].pr; - rg->rMap[f]->r_con.rcv[i].sz = rg->lMap[f]->r_con.rcv[i].sz; - rg->rMap[f]->r_con.rcv[i].cnt = 0; - rg->lMap[f]->r_con.rcv[i].cnt = 0; - - if(Perilla::genTags) - { - try - { - int rcv_pr = rg->rMap[f]->r_con.rcv[i].pr; - int dstIndex = rg->rMap[f]->r_con.rcv[i].nd; - int srcIndex = rg->rMap[f]->r_con.rcv[i].ns; - int psize = rg->rMap[f]->r_con.rcv[i].sz; - std::map::iterator itr = tagMap[rcv_pr][rg->graphID-1][dstIndex][srcIndex].find(psize); - if( itr != 
tagMap[rcv_pr][rg->graphID-1][dstIndex][srcIndex].end()) - { - //rg->rCopyMapHead->map[f]->r_con.rcv[dcnt].lnd = itr->second; - } - else - { - tagMap[rcv_pr][rg->graphID-1][dstIndex][srcIndex][psize] = Perilla::uTags++; - //rg->rCopyMapHead->map[f]->r_con.rcv[dcnt].lnd = Perilla::uTags++; - std::map::iterator itr2 = pTagCnt[rcv_pr].find(rg->graphID-1); - if(itr2 != pTagCnt[rcv_pr].end()) - pTagCnt[rcv_pr][rg->graphID-1] = pTagCnt[rcv_pr][rg->graphID-1] + 1; - else - pTagCnt[rcv_pr][rg->graphID-1] = 1; - } - } - catch(std::exception& e) - { - std::cout <<"Inside tagGeneration gID "<< rg->graphID <<" "<< e.what() << '\n'; - } - } - //tagMap[rcv_pr][rg->graphID][it->dstIndex][it->srcIndex] = pTagCnt[rcv_pr]; - - for(int p=0; plMap[f]->r_con.rcv[i].sz); -#ifdef PERILLA_USE_UPCXX - void* local_ptr= tmpPkg->databuf.local();//(static_cast >(tmpPkg->databuf)).local(); - for(int j=0; jlMap[f]->r_con.rcv[i].sz; j++) - ((double*)local_ptr)[j]= 0; -#else - for(int j=0; jlMap[f]->r_con.rcv[i].sz; j++) - ((double*)tmpPkg->databuf)[j] = 0; -#endif - rg->rMap[f]->r_con.rcv[i].pQueue.enqueue(tmpPkg); - } - for(int p=0; prMap[f]->r_con.rcv[i].recycleQueue.enqueue(rg->rMap[f]->r_con.rcv[i].pQueue.dequeue()); - } - } - }// if(tid==0) - - }// omp parallel -}// multifabBuildFabCon - - -#if 0 -void Perilla::serviceLocalRequests(RegionGraph* rg, int tg) -{ - int numfabs = rg->lMap.size(); - - for(int f=0; flMap[f]->l_con.sLock)); - //if(lockSucceeded != 0) // 0-Fail, otherwise-Succeed - { - for(int i=0; ilMap[f]->l_con.nscpy; i++){ - if(rg->lMap[f]->l_con.scpy[i].pQueue.queueSize()>0) - { - pthread_mutex_lock(&(rg->lMap[f]->l_con.sLock)); - assert(doublechecked==false); - Package *sPackage = rg->lMap[f]->l_con.scpy[i].pQueue.dequeue(); - if(perilla::LAZY_PUSH) - { - // Implemetation deffered. Currently not required - } - //if(graph->graphID == 1 && rg->lMap[f]->l_con.scpy[i].nd == 1) - //std::cout<< "Processing gID 1 nd 1 from f " << f << " i " << i << std::endl; - pthread_mutex_lock(&(rg->lMap[rg->lMap[f]->l_con.scpy[i].nd]->l_con.dLock)); - int dPartner = rg->lMap[f]->l_con.scpy[i].dPartner; - - //if(rg->lMap[rg->lMap[f]->l_con.scpy[i].nd]->l_con.dcpy[dPartner].recycleQueue.queueSize() == 0 ) - if(dPartner == -1) - std::cout<< " Caution rQ size dPrtn "<< rg->lMap[rg->lMap[f]->l_con.scpy[i].nd]->l_con.ndcpy << " " << dPartner <<" graph ID " <graphID<lMap[rg->lMap[f]->l_con.scpy[i].nd]->l_con.dcpy[dPartner].recycleQueue.queueSize() <lMap[rg->lMap[f]->l_con.scpy[i].nd]->l_con.dcpy[dPartner].recycleQueue.dequeue(true); - - //for(int j=0; jbufSize; j++) - //dPackage->databuf[j] = sPackage->databuf[j]; //copy data------------------------------??????????????? - - std::memcpy(dPackage->databuf, sPackage->databuf, dPackage->bufSize * sizeof(double)); - - rg->lMap[rg->lMap[f]->l_con.scpy[i].nd]->l_con.dcpy[dPartner].pQueue.enqueue(dPackage,true); - if(rg->lMap[rg->lMap[f]->l_con.scpy[i].nd]->l_con.dcpy[dPartner].pQueue.queueSize(true)==1) - rg->lMap[rg->lMap[f]->l_con.scpy[i].nd]->l_con.firingRuleCnt++; - pthread_mutex_unlock(&(rg->lMap[rg->lMap[f]->l_con.scpy[i].nd]->l_con.dLock)); - rg->lMap[f]->l_con.scpy[i].recycleQueue.enqueue(sPackage,true); - pthread_mutex_unlock(&(rg->lMap[f]->l_con.sLock)); - } - } - //pthread_mutex_unlock(&(rg->lMap[f]->l_con.sLock)); - }// if(!lock succeedded) - if(perilla::LAZY_PUSH) - { - // Implemetation deffered. 
Currently not required - } - }// if(tg==fg) - }// for(frMap.size(); - - // !we first post send and receive - for(int f=0; frMap[f]->r_con.rcvLock)); - //if(lockSucceeded != 0) - { - //if(pthread_mutex_trylock(&(rg->lMap[f]->r_con.rcvLock)) != 0) - { - for(int i=0; ilMap[f]->r_con.nrcv; i++) - { - if(rg->rMap[f]->r_con.rcv[i].pQueue.queueSize(true) == 0) //!no message has been received or all received messages have been claimed - nextsReq = true; - else - { - Package *rearPackage = rg->rMap[f]->r_con.rcv[i].pQueue.getRear(true);//!CHECK THIS POINT LATER - if(rearPackage->completed && rg->rMap[f]->r_con.rcv[i].pQueue.queueSize(true) == 1) //!latest receive request has been completed - nextsReq = true; - else //!expected message is still on the way - nextsReq = false; - } - if(nextsReq) //!take a message from recycle pool and post a receive - { - pthread_mutex_lock(&(rg->rMap[f]->r_con.rcvLock)); - pthread_mutex_lock(&(rg->lMap[f]->r_con.rcvLock)); - int ns = rg->rMap[f]->r_con.rcv[i].ns; - int nd = rg->rMap[f]->r_con.rcv[i].nd; - int lnd = rg->rMap[f]->r_con.rcv[i].lnd; - int r_grids = rg->rMap[f]->r_con.rcv[i].r_grids; - //!create a package to keep track of receive requests - Package *rMetaPackage = rg->rMap[f]->r_con.rcv[i].recycleQueue.dequeue(true); - //!extract a package from the recycle pool at the destination NUMA node to buffer incoming data - Package *rPackage = rg->lMap[f]->r_con.rcv[i].recycleQueue.dequeue(true); - //tag = tagGen(mf%rMap(f)%r_con%rcv(i)%ns, mf%rMap(f)%r_con%rcv(i)%nd, gid, parallel_nprocs()*nfabs(mf), ngr)---------?????? - //int tag = tagGen(rg->rMap[f]->r_con.rcv[i].ns, rg->rMap[f]->r_con.rcv[i].nd, graphID-1, np*numfabs, nGraphs); - int tag = tagMap[rg->rMap[f]->r_con.rcv[i].pr][graphID][nd][ns][rg->rMap[f]->r_con.rcv[i].sz]; - - rMetaPackage->request = MPI_REQUEST_NULL; - rg->lMap[f]->r_con.rcv[i].pQueue.enqueue(rPackage,true); //!this is not done yet - rg->rMap[f]->r_con.rcv[i].pQueue.enqueue(rMetaPackage,true); //!this is not done yet - //rMetaPackage->request = parallel_irecv_dv(rpackage%ptr%dataBuf,mf%rMap(f)%r_con%rcv(i)%sz, mf%rMap(f)%r_con%rcv(i)%pr, tag) --------- ???? - rMetaPackage->request = ParallelDescriptor::Arecv(rPackage->databuf, - rg->rMap[f]->r_con.rcv[i].sz, - rg->rMap[f]->r_con.rcv[i].pr, tag).req(); // tag == SeqNum in c++ ver - pthread_mutex_unlock(&(rg->lMap[f]->r_con.rcvLock)); - pthread_mutex_unlock(&(rg->rMap[f]->r_con.rcvLock)); - } - } - //pthread_mutex_unlock(&(rg->lMap[f]->r_con.rcvLock)); - }// if(omp_test_lock) - //pthread_mutex_unlock(&(rg->rMap[f]->r_con.rcvLock)); - }// if(lockSucceeded) - }// for(fsMap[f]->r_con.nsnd; i++) - { - if(rg->sMap[f]->r_con.snd[i].pQueue.queueSize(true) == 0) //then !no message has been issued or all send requests have been fulfilled - nextrReq = false; - else - nextrReq = true; - - if(nextrReq) - { - Package *sMetaPackage = rg->sMap[f]->r_con.snd[i].pQueue.getFront(true); - if(!sMetaPackage->served) - { - Package *sPackage = rg->lMap[f]->r_con.snd[i].pQueue.getFront(true); - sMetaPackage->completed = false; - sMetaPackage->served = true; - sMetaPackage->request = MPI_REQUEST_NULL; - int ns = rg->sMap[f]->r_con.snd[i].ns; - int nd = rg->sMap[f]->r_con.snd[i].nd; - int r_gid = rg->sMap[f]->r_con.snd[i].r_gid; - int r_grids = rg->sMap[f]->r_con.snd[i].r_grids; - //tag = tagGen(mf%sMap(f)%r_con%snd(i)%ns, mf%sMap(f)%r_con%snd(i)%nd, gid, parallel_nprocs()*nfabs(mf), ngr) -??????? 
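Both the receive posted above and the matching send must derive the same MPI tag, so the code keeps a nested tagMap keyed by (remote rank, graph, destination FAB, source FAB, message size) and mints a fresh tag from a shared counter on first use. A compact sketch of that registry; the type alias and the counter argument are assumptions, not the original declarations:

#include <map>

// Hedged sketch of the nested tag registry used above:
// tagMap[proc][graph][dstFab][srcFab][size] -> unique MPI tag.
using TagMap = std::map<int, std::map<int, std::map<int, std::map<int, std::map<int,int>>>>>;

int lookup_or_assign_tag(TagMap& tagMap, int& nextTag,
                         int pr, int gid, int dst, int src, int psize)
{
    auto& bySize = tagMap[pr][gid][dst][src];
    auto it = bySize.find(psize);
    if (it != bySize.end()) return it->second; // both endpoints rediscover the same tag
    bySize[psize] = nextTag;                   // first encounter: mint a new tag
    return nextTag++;
}

Because both ranks walk the same copy tags in the same order, each side reproduces the identical tag assignment without any extra communication.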
- //int tag = tagGen(rg->sMap[f]->r_con.snd[i].ns, rg->sMap[f]->r_con.snd[i].nd, graphID-1, np*numfabs, nGraphs); - int tag = Perilla::myTagMap[r_gid][nd][ns][rg->sMap[f]->r_con.snd[i].sz]; - //int tag = myTagMap[graphID-1][rg->sMap[f]->r_con.snd[i].nd][rg->sMap[f]->r_con.snd[i].ns]; - //sMetaPackage%ptr%request = parallel_isend_dv(spackage%ptr%dataBuf,mf%sMap(f)%r_con%snd(i)%sz, mf%sMap(f)%r_con%snd(i)%pr, tag) --????? - sMetaPackage->request = ParallelDescriptor::Asend(sPackage->databuf, - rg->sMap[f]->r_con.snd[i].sz, - rg->sMap[f]->r_con.snd[i].pr, tag).req(); // tag == SeqNum in c++ ver - } - } - } // for(irMap[f]->r_con.nrcv; i++) - { - if(rg->rMap[f]->r_con.rcv[i].pQueue.queueSize(true) > 0) //!all messages before rear have completed - { - //if(pthread_mutex_trylock(&(rg->lMap[f]->r_con.rcvLock)) != 0) // 0-Fail, otherwise-Succeed - { - Package *rearPackage = rg->rMap[f]->r_con.rcv[i].pQueue.getRear(true); - if(!rearPackage->completed) - { - bool flag = false; - int ret_flag; - MPI_Status status; - - std::cout<< "myP "<< myProc << " f "<< f << " i "<< i<< " Req "<request << std::endl; - - ParallelDescriptor::Test(rearPackage->request, ret_flag, status); - flag = (ret_flag == 0) ? false : true;//parallel_test_one(rearPackage%ptr%request) -------??????? - if(flag) - { - pthread_mutex_lock(&(rg->lMap[f]->r_con.rcvLock)); - rearPackage->completeRequest(); - rg->lMap[f]->r_con.rcv[i].pQueue.getRear()->completeRequest(); - if(rg->rMap[f]->r_con.rcv[i].pQueue.queueSize(true) == 1) - rg->lMap[f]->r_con.firingRuleCnt++; - pthread_mutex_unlock(&(rg->lMap[f]->r_con.rcvLock)); - } - } - //pthread_mutex_unlock(&(rg->lMap[f]->r_con.rcvLock)); - } // if(omp_test_lock) - } // if(queueSize > 0) - } // for(ilMap[f]->r_con.nsnd; i++) - { - if(rg->sMap[f]->r_con.snd[i].pQueue.queueSize(true) > 0) - { - Package *frontPackage = rg->sMap[f]->r_con.snd[i].pQueue.getFront(true); - if(frontPackage->served && !frontPackage->completed) //!latest receive request has NOT been completed - { - bool flag = false; - int ret_flag; - MPI_Status status; - ParallelDescriptor::Test(frontPackage->request, ret_flag, status); - flag = (ret_flag == 0) ? false : true;//parallel_test_one(frontPackage%ptr%request) -------??????? 
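Completion is detected by polling rather than blocking: the service loop calls ParallelDescriptor::Test on the request attached to the rear receive package (or the front send package) and reacts only when the flag comes back nonzero. A bare-MPI sketch of one such polling step, assuming a previously posted nonblocking request:

#include <mpi.h>

// Hedged sketch: poll one outstanding request without blocking.
// Returns true exactly once, when the message has landed.
bool poll_request(MPI_Request& req, int& firingRuleCnt)
{
    int done = 0;
    MPI_Status status;
    MPI_Test(&req, &done, &status); // never blocks; done != 0 means complete
    if (done) ++firingRuleCnt;      // one more input ready for the task to fire
    return done != 0;
}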
- if(flag) - { - pthread_mutex_lock(&(rg->sMap[f]->r_con.sndLock)); - frontPackage = rg->sMap[f]->r_con.snd[i].pQueue.dequeue(true); - frontPackage->completed = false; - frontPackage->served = false; - frontPackage->request = MPI_REQUEST_NULL; - rg->sMap[f]->r_con.snd[i].recycleQueue.enqueue(frontPackage,true); - pthread_mutex_unlock(&(rg->sMap[f]->r_con.sndLock)); - pthread_mutex_lock(&(rg->lMap[f]->r_con.sndLock)); - frontPackage = rg->lMap[f]->r_con.snd[i].pQueue.dequeue(true); - frontPackage->completed = false; - frontPackage->served = false; - frontPackage->request = MPI_REQUEST_NULL; - rg->lMap[f]->r_con.snd[i].recycleQueue.enqueue(frontPackage,true); - pthread_mutex_unlock(&(rg->lMap[f]->r_con.sndLock)); - } - } - } // if(queueSize > 0) - } // for(inComp(); - int tg= WorkerThread::perilla_wid(); - int ntid = WorkerThread::perilla_wtid(); - - //if(graph->graphID == 1 && f == 1) - //std::cout << "fillBPush for gID 1 f 1 ntid "<< ntid <lMap[f]->l_con.sLock)); - graph->worker[tg]->barr->sync(perilla::NUM_THREADS_PER_TEAM-1); // Barrier to synchronize team threads - - if(perilla::PACKING_FINEGRAIN) - {} - else - { - for(int i=0; ilMap[f]->l_con.nscpy; i++) - if( (i%(perilla::NUM_THREADS_PER_TEAM-1)) == ntid) - { - - //if(graph->graphID == 1 && graph->lMap[f]->l_con.scpy[i].nd == 1) - //std::cout << "fillBPush for gID 1 nd 1 pQenQ f " << f << " i " << i <lMap[f]->l_con.scpy[i].recycleQueue.getFront(true); - mf->m_fabs_v[f]->copyToMem(graph->lMap[f]->l_con.scpy[i].sbx,0,nComp,sPackage->databuf); - - for(int d=0; dbufSize; d++) - if(sPackage->databuf[d] == 0) - { - //std::cout<< "in fbPush Sending 0 from f "<< f <databuf[d] != 0); - } - //if(graph->lMap[f]->l_con.scpy[i].sbx.smallEnd() == graph->lMap[f]->l_con.scpy[i].sbx.bigEnd()) - //if(graph->lMap[f]->l_con.scpy[i].sbx.smallEnd(0)==7 && graph->lMap[f]->l_con.scpy[i].sbx.smallEnd(1)==7 && graph->lMap[f]->l_con.scpy[i].sbx.smallEnd(2)==4) - // std::cout<< "Corner Push for f "<< f << " data0 " <databuf[0]<< " size " <bufSize << " se "<< graph->lMap[f]->l_con.scpy[i].sbx.smallEnd() <worker[tg]->barr->sync(perilla::NUM_THREADS_PER_TEAM-1); // Barrier to synchronize team threads - - if(ntid==0) - { - //if(graph->graphID == 1 && f == 1) - //std::cout << "fillBPush for gID 1 f 1 pQ enQ" <lMap[f]->l_con.nscpy; i++) - { - //if(graph->graphID == 1 && graph->lMap[f]->l_con.scpy[i].nd == 1) - //std::cout << "fillBPush for gID 1 nd 1 pQ enQ from f "<< f <lMap[f]->l_con.scpy[i].pQueue.enqueue( graph->lMap[f]->l_con.scpy[i].recycleQueue.dequeue(true),true ); - } - pthread_mutex_unlock(&(graph->lMap[f]->l_con.sLock)); - } - graph->worker[tg]->barr->sync(perilla::NUM_THREADS_PER_TEAM-1); // Barrier to synchronize team threads - } // if(LAZY_PUSH) - else - - int np = ParallelDescriptor::NProcs(); - if (np==1) return; - - if(ntid==0) - pthread_mutex_lock(&(graph->lMap[f]->r_con.sndLock)); - graph->worker[tg]->barr->sync(perilla::NUM_THREADS_PER_TEAM-1); // Barrier to synchronize team threads - - for(int i=0; ilMap[f]->r_con.nsnd; i++) - if((i%(perilla::NUM_THREADS_PER_TEAM-1))==ntid) - { - //std::cout << "RQS " << graph->lMap[f]->r_con.snd[i].recycleQueue.queueSize() << std::endl; - - Package *sndPackage = graph->lMap[f]->r_con.snd[i].recycleQueue.dequeue(true); - mf->m_fabs_v[f]->copyToMem(graph->lMap[f]->r_con.snd[i].sbx,0,nComp,sndPackage->databuf); - graph->lMap[f]->r_con.snd[i].pQueue.enqueue( sndPackage,true ); - //!the local message handler will detect the change and notify the remote message handler =>read access - //!the remote message handler 
first modifies the front item of this queue, then it push this item back to the message pool - } - graph->worker[tg]->barr->sync(perilla::NUM_THREADS_PER_TEAM-1); // Barrier to synchronize team threads - if(ntid==0) - { - pthread_mutex_unlock(&(graph->lMap[f]->r_con.sndLock)); - pthread_mutex_lock(&(graph->sMap[f]->r_con.sndLock)); - for(int i=0; ilMap[f]->r_con.nsnd; i++) - graph->sMap[f]->r_con.snd[i].pQueue.enqueue( graph->sMap[f]->r_con.snd[i].recycleQueue.dequeue(true),true ); - pthread_mutex_unlock(&(graph->sMap[f]->r_con.sndLock)); - } - -} // fillBoundaryPush -#endif - - -#if 0 -void Perilla::fillBoundaryPull(RegionGraph* graph, MultiFab* mf, int f, bool singleT) -{ -exit(0); - int nComp = mf->nComp(); - int tg= WorkerThread::perilla_wid(); - int ntid = WorkerThread::perilla_wtid(); - - if(ntid==0) - pthread_mutex_lock(&(graph->lMap[f]->l_con.dLock)); - if(!singleT) - graph->worker[tg]->barr->sync(perilla::NUM_THREADS_PER_TEAM-1); // Barrier to synchronize team threads - - if(perilla::LAZY_PUSH) - { } - else - { - if(perilla::UNPACKING_FINEGRAIN) - {} - else - { - for(int i=0; ilMap[f]->l_con.ndcpy; i++) - if( (i%(perilla::NUM_THREADS_PER_TEAM-1)) == ntid) - { - Package *dPackage = graph->lMap[f]->l_con.dcpy[i].pQueue.getFront(true); - - /*for(int d=0; dbufSize; d++) - if(dPackage->databuf[d] == 0) - { - //std::cout<< "in fbPull Reciving 0 for f "<< f <databuf[d] != 0); - }*/ - /* - if(f==0) - //if(graph->lMap[f]->l_con.dcpy[i].dbx.smallEnd() == graph->lMap[f]->l_con.dcpy[i].dbx.bigEnd()) - //if(graph->lMap[f]->l_con.dcpy[i].dbx.smallEnd(0)==-1 && graph->lMap[f]->l_con.dcpy[i].dbx.smallEnd(1)==-1 && graph->lMap[f]->l_con.dcpy[i].dbx.smallEnd(2)==4) - std::cout<< "Corner Pull for f "<< f << " data0 " <databuf[0]<< " size " <bufSize <<" se " <lMap[f]->l_con.dcpy[i].dbx.smallEnd()<m_fabs_v[f]->copyFromMem(graph->lMap[f]->l_con.dcpy[i].dbx,0,nComp,dPackage->databuf); - } - } // if(UNPACKING_FINEGRAIN) - else - } // if(LAZY_PUSH) - else - - if(!singleT) - graph->worker[tg]->barr->sync(perilla::NUM_THREADS_PER_TEAM-1); // Barrier to synchronize team threads - - if(ntid==0) - { - for(int i=0; ilMap[f]->l_con.ndcpy; i++) - graph->lMap[f]->l_con.dcpy[i].recycleQueue.enqueue( graph->lMap[f]->l_con.dcpy[i].pQueue.dequeue(true),true ); - - graph->lMap[f]->l_con.firingRuleCnt = graph->lMap[f]->l_con.firingRuleCnt - graph->lMap[f]->l_con.ndcpy; - - graph->lMap[f]->l_con.scpyCnt = 0; - for(int i=0; ilMap[f]->l_con.ndcpy; i++) - if(graph->lMap[f]->l_con.dcpy[i].pQueue.queueSize(true) >= 1) - graph->lMap[f]->l_con.firingRuleCnt++; - pthread_mutex_unlock(&(graph->lMap[f]->l_con.dLock)); - } - if(!singleT) - graph->worker[tg]->barr->sync(perilla::NUM_THREADS_PER_TEAM-1); // Barrier to synchronize team threads - - int np = ParallelDescriptor::NProcs(); - if (np==1) return; - - if(ntid==0) - { - pthread_mutex_lock(&(graph->rMap[f]->r_con.rcvLock)); - pthread_mutex_lock(&(graph->lMap[f]->r_con.rcvLock)); - } - if(!singleT) - graph->worker[tg]->barr->sync(perilla::NUM_THREADS_PER_TEAM-1); // Barrier to synchronize team threads - - for(int i=0; ilMap[f]->r_con.nrcv; i++) - if( (i%(perilla::NUM_THREADS_PER_TEAM-1)) == ntid) - { - Package *rcvMetaPackage = graph->rMap[f]->r_con.rcv[i].pQueue.dequeue(true); - rcvMetaPackage->completed = false; - rcvMetaPackage->served = false; - rcvMetaPackage->request = MPI_REQUEST_NULL; - graph->rMap[f]->r_con.rcv[i].recycleQueue.enqueue(rcvMetaPackage,true); - Package *rcvPackage = graph->lMap[f]->r_con.rcv[i].pQueue.dequeue(true); - 
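copyToMem and copyFromMem flatten a Box-shaped subregion of a FAB into the package's contiguous databuf, which is why psize is always numPts() times nComp(). A hedged sketch of the packing direction for one component, assuming column-major (Fortran-order) FAB storage; the extent arguments are hypothetical simplifications of AMReX's Box:

// Hedged sketch of what copyToMem does: flatten an (nx x ny x nz)
// subregion starting at (ox,oy,oz) of a larger column-major FAB
// array (fnx x fny planes) into a contiguous message buffer.
void pack_box(const double* fab, int fnx, int fny,
              int ox, int oy, int oz, int nx, int ny, int nz,
              double* buf)
{
    long k = 0;
    for (int z = 0; z < nz; ++z)
        for (int y = 0; y < ny; ++y)
            for (int x = 0; x < nx; ++x)
                buf[k++] = fab[(ox+x) + (long)fnx*((oy+y) + (long)fny*(oz+z))];
}

copyFromMem is the mirror image, scattering the flat buffer back into the ghost region of the destination FAB.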
mf->m_fabs_v[f]->copyFromMem(graph->lMap[f]->r_con.rcv[i].dbx,0,nComp,rcvPackage->databuf); - rcvPackage->completed = false; - graph->lMap[f]->r_con.rcv[i].recycleQueue.enqueue(rcvPackage,true); - } - if(!singleT) - graph->worker[tg]->barr->sync(perilla::NUM_THREADS_PER_TEAM-1); // Barrier to synchronize team threads - - if(ntid==0) - { - graph->lMap[f]->r_con.firingRuleCnt = graph->lMap[f]->r_con.firingRuleCnt - graph->lMap[f]->r_con.nrcv; - for(int i=0; ilMap[f]->r_con.nrcv; i++) - if(graph->lMap[f]->r_con.rcv[i].pQueue.queueSize(true) >= 1) - if(graph->lMap[f]->r_con.rcv[i].pQueue.getFront(true)->checkRequest()) - graph->lMap[f]->r_con.firingRuleCnt++; - pthread_mutex_unlock(&(graph->lMap[f]->r_con.rcvLock)); - pthread_mutex_unlock(&(graph->rMap[f]->r_con.rcvLock)); - } - -} // fillBoundaryPull -#endif - - - - -///////////////////////////////////////////////////////////////////////////////////////////////////////////////// - -void Perilla::multifabExtractCopyAssoc(RegionGraph* gDst, RegionGraph* gSrc, const MultiFab& mfDst, const MultiFab& mfSrc, int nc, int ng, int ngSrc, const Periodicity& period) -{ - // MultiFab* mfSrc = gSrc->assocMF; - // MultiFab* mfDst = gDst->assocMF; - int myProc = ParallelDescriptor::MyProc(); - int np = ParallelDescriptor::NProcs(); - - try{ - - if(true)//if(!(*mfSrc == *mfDst)) - { - if(ng > mfDst.nGrow()) cout <<"MULTIFAB_COPY_C: ng > mfDst.nGrow not supported in parallel copy"<< endl; - if(ngSrc > mfSrc.nGrow()) cout <<"MULTIFAB_COPY_C: ngSrc > mfSrc.nGrow"<< endl; - if(ngSrc > 0) - { - - // To be implemented - //do i = 1, nboxes(msrc%la) - // call push_back(bl, grow(box_nodalize(get_box(msrc%la,i),msrc%nodal),lngsrc)) - //end do - //call build(batmp, bl, sort = .false.) - //call destroy(bl) - //call build(lasrctmp, batmp, boxarray_bbox(batmp), explicit_mapping = get_proc(msrc%la)) - //call destroy(batmp) - //call build(msrctmp, lasrctmp, nc = lnc, ng = 0) - //pmfsrc => msrctmp - } - if(np > 1) - { - if(gSrc->sCopyMapHead == 0) - gSrc->sCopyMapHead = new CopyMap(); - else - { - CopyMap *tmpCopyMap = new CopyMap(); - tmpCopyMap->next = gSrc->sCopyMapHead; - gSrc->sCopyMapHead = tmpCopyMap; - } - if(gDst->rCopyMapHead == 0) - gDst->rCopyMapHead = new CopyMap(); - else - { - CopyMap *tmpCopyMap = new CopyMap(); - tmpCopyMap->next = gDst->rCopyMapHead; - gDst->rCopyMapHead = tmpCopyMap; - } - //gSrc->sCopyMapHead->map.reserve(mfSrc.size()); - //gDst->rCopyMapHead->map.reserve(mfDst.size()); - gSrc->sCopyMapHead->alloc_CopyMap(mfSrc); - gDst->rCopyMapHead->alloc_CopyMap(mfDst); - } - - if(gSrc->numTasks != mfSrc.IndexArray().size()) - std::cout<< "before " <numTasks << " now " <graphID << std::endl; - - gSrc->numFabs = mfSrc.size(); - gDst->numFabs = mfDst.size(); - - gSrc->numTasks = mfSrc.IndexArray().size(); - gDst->numTasks = mfDst.IndexArray().size(); - - int nfabsSrc = mfSrc.IndexArray().size(); - int nfabsDst = mfDst.IndexArray().size(); - - const FabArrayBase::CPC& TheCPC = mfDst.getCPC(IntVect(ng), mfSrc, IntVect(ngSrc), period); - - const int nloc_cpAsc = TheCPC.m_LocTags->size(); - const int nsnds_cpAsc = TheCPC.m_SndTags->size(); - const int nrcvs_cpAsc = TheCPC.m_RcvTags->size(); - - Vector send_cctc; - Vector send_pr; - send_cctc.reserve(nsnds_cpAsc); - - for (FabArrayBase::MapOfCopyComTagContainers::const_iterator m_it = TheCPC.m_SndTags->begin(), - m_End = TheCPC.m_SndTags->end(); - m_it != m_End; - ++m_it) - { - if(m_it->first != myProc) // Not destined to me. 
- { - send_pr.push_back(m_it->first); - send_cctc.push_back(&(m_it->second)); - } - } - - // std::cout<< "Loop 1" < recv_cctc; - Vector recv_pr; - recv_cctc.reserve(nrcvs_cpAsc); - - for (FabArrayBase::MapOfCopyComTagContainers::const_iterator m_it = TheCPC.m_RcvTags->begin(), - m_End = TheCPC.m_RcvTags->end(); - m_it != m_End; - ++m_it) - { - if(m_it->first != myProc) // I am not the source for this receipt - { - recv_pr.push_back(m_it->first); - recv_cctc.push_back(&(m_it->second)); - } - } - - //std::cout<< "Before parallel at gID " << gDst->graphID << " numTask " << gDst->numTasks << " numFabs " << gDst->numFabs <graphID > 25) - //std::cout<< "Inside parallel Generating Send at tid " << tid << " f " << f << " gID " << gDst->graphID <task[f]->cpAsc_srcHead == 0) - { - gSrc->task[f]->cpAsc_srcHead = new FabCopyAssoc(); - cpSrc = gSrc->task[f]->cpAsc_srcHead; - } - else - { - cpSrc = new FabCopyAssoc(); - cpSrc->next = gSrc->task[f]->cpAsc_srcHead; - gSrc->task[f]->cpAsc_srcHead = cpSrc; - } - - cpSrc->graphPartner = gDst; - cpSrc->l_con.nscpy = 0; - for(int i=0; il_con.nscpy++; - } - cpSrc->l_con.scpy = new LocalCopyDescriptor[cpSrc->l_con.nscpy]; - int scnt = 0; - //if(gDst->graphID == 4 && tag.dstIndex == 60 ) - //std::cout<< "Inside parallel Generating Local Copy send at tid " << tid << " f " << f << " gID " << gDst->graphID <graphID == 4 && (tag.dstIndex == 60 || tag.dstIndex == 59) ) - //std::cout <<"myP " <l_con.scpy[scnt].ns = mfSrc.localindex(tag.srcIndex); - cpSrc->l_con.scpy[scnt].nd = mfDst.localindex(tag.dstIndex); - cpSrc->l_con.scpy[scnt].sbx = tag.sbox; - cpSrc->l_con.scpy[scnt].dbx = tag.dbox; - int psize = tag.sbox.numPts() * mfSrc.nComp(); //---------------------------------------------------------------???????????????? - //std::cout<< " gSrc ID "<< gSrc->graphID << " f "<databuf.local();//(static_cast >(tmpPkg->databuf)).local(); - for(int j=0; jdatabuf)[j] = 0; -#endif - cpSrc->l_con.scpy[scnt].pQueue.enqueue(tmpPkg); - } - for(int p=0; pl_con.scpy[scnt].recycleQueue.enqueue(cpSrc->l_con.scpy[scnt].pQueue.dequeue()); - scnt++; - } - } - - if(np > 1) - { - cpSrc->r_con.nsnd = 0; - cpSrc->r_con.remotePushReady = false; - cpSrc->r_con.firingRuleCnt = 0; - for(int i=0; isrcIndex) - cpSrc->r_con.nsnd++; - } - } // for(ir_con.snd = new RemoteCommDescriptor[cpSrc->r_con.nsnd]; - scnt = 0; - for(int i=0; isrcIndex) - { - - //if(gDst->graphID == 17 && (it->srcIndex == 1198 || it->srcIndex == 1198 || it->srcIndex == 978 || it->srcIndex == 978)) - //std::cout <<"myP " <dstIndex << " s "<< it->srcIndex << " f " << f << " i "<< scnt << " tg " <r_con.snd[scnt].ns = it->srcIndex; - cpSrc->r_con.snd[scnt].nd = it->dstIndex; - cpSrc->r_con.snd[scnt].lns = mfSrc.localindex(it->srcIndex); - cpSrc->r_con.snd[scnt].lnd = mfDst.localindex(it->dstIndex); - cpSrc->r_con.snd[scnt].sbx = it->sbox; - cpSrc->r_con.snd[scnt].dbx = it->dbox; - int psize = it->sbox.numPts() * mfSrc.nComp(); //---------------------------------------------------------------???????????????? 
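Descriptor arrays such as r_con.snd are sized with a two-pass idiom: one walk over the copy tags counts the matches, the exact-size array is allocated, and a second walk fills it while advancing a cursor (scnt/dcnt in the original). A generic sketch of the pattern with a stand-in Desc type:

#include <algorithm>
#include <vector>

// Hedged sketch of the count-then-fill idiom used for snd/rcv descriptors:
// pass 1 counts matches, pass 2 fills a tightly sized array.
struct Desc { int src, dst; };

std::vector<Desc> build_descriptors(const std::vector<Desc>& tags, int myFab)
{
    int n = (int)std::count_if(tags.begin(), tags.end(),
                               [&](const Desc& t) { return t.src == myFab; });
    std::vector<Desc> out;
    out.reserve(n);                           // exact allocation, as with new Desc[n] above
    for (const Desc& t : tags)
        if (t.src == myFab) out.push_back(t); // scnt++ in the original
    return out;
}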
- - for(int p=0; pdatabuf.local();//(static_cast >(tmpPkg->databuf)).local(); - for(int j=0; jdatabuf)[j] = 0; -#endif - cpSrc->r_con.snd[scnt].pQueue.enqueue(tmpPkg); - } - for(int p=0; pr_con.snd[scnt].recycleQueue.enqueue(cpSrc->r_con.snd[scnt].pQueue.dequeue()); - scnt++; - } - } - } // for(i 1) - } // if(fg==tg) -//#pragma omp barrier - // std::cout<< "Barrier 1" < 1) - { - //if(WorkerThread::perilla_isMasterWorkerThread() && tg==0) -// if(tid==0) - { - - // std::cout<< "Inside parallel Generating Remote Send tg 0 at tid " << tid << " f " << f << " gID " << gDst->graphID <sCopyMapHead->map[f]->r_con.nsnd = 0; - gSrc->sCopyMapHead->map[f]->r_con.firingRuleCnt = 0; - for(int i=0; isrcIndex) - gSrc->sCopyMapHead->map[f]->r_con.nsnd++; - } - } // for(isCopyMapHead->map[f]->r_con.snd = new RemoteCommDescriptor[gSrc->sCopyMapHead->map[f]->r_con.nsnd]; - int scnt = 0; - for(int i=0; isrcIndex) - { - - //if(gDst->graphID == 31 && (it->dstIndex == 519)) - //std::cout <<"myP " <dstIndex << " ns "<< it->srcIndex << " f " << f << " i "<< scnt << " tg " <sCopyMapHead->map[f]->r_con.snd[scnt].ns = it->srcIndex; - gSrc->sCopyMapHead->map[f]->r_con.snd[scnt].nd = it->dstIndex; - gSrc->sCopyMapHead->map[f]->r_con.snd[scnt].r_gid = gDst->graphID-1; - gSrc->sCopyMapHead->map[f]->r_con.snd[scnt].r_grids = (gDst->numFabs > gSrc->numFabs ? gDst->numFabs : gSrc->numFabs); - gSrc->sCopyMapHead->map[f]->r_con.snd[scnt].lns = mfSrc.localindex(it->srcIndex); - gSrc->sCopyMapHead->map[f]->r_con.snd[scnt].lnd = mfDst.localindex(it->dstIndex); - gSrc->sCopyMapHead->map[f]->r_con.snd[scnt].sbx = it->sbox; - gSrc->sCopyMapHead->map[f]->r_con.snd[scnt].dbx = it->dbox; - - int psize = it->sbox.numPts() * mfSrc.nComp(); //---------------------------------------------------------------???????????????? 
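The psize just computed sizes every buffer in this file: a message covers one box with nComp components, one double per point. A trivial sketch of that arithmetic, with hypothetical extent parameters standing in for Box::numPts():

// Hedged sketch of the repeated psize computation: the number of doubles
// in a message covering an (nx x ny x nz) box with nComp components.
long message_doubles(int nx, int ny, int nz, int nComp)
{
    return (long)nx * ny * nz * nComp;  // box.numPts() * nComp
}

long message_bytes(int nx, int ny, int nz, int nComp)
{
    return message_doubles(nx, ny, nz, nComp) * (long)sizeof(double);
}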
- - gSrc->sCopyMapHead->map[f]->r_con.snd[scnt].sz = psize; - gSrc->sCopyMapHead->map[f]->r_con.snd[scnt].pr = send_pr[i]; - - for(int p=0; pdatabuf[j] = 0; - gSrc->sCopyMapHead->map[f]->r_con.snd[scnt].pQueue.enqueue(tmpPkg); - } - for(int p=0; psCopyMapHead->map[f]->r_con.snd[scnt].recycleQueue.enqueue(gSrc->sCopyMapHead->map[f]->r_con.snd[scnt].pQueue.dequeue()); - scnt++; - } - } - } // for(i 1) - } // for(fgraphID > 25) - //std::cout<< "Inside parallel Generating Recive at tid " << tid << " f " << f << " gID " << gDst->graphID <task[f]->cpAsc_dstHead == 0) - { - gDst->task[f]->cpAsc_dstHead = new FabCopyAssoc(); - cpDst = gDst->task[f]->cpAsc_dstHead; - } - else - { - cpDst = new FabCopyAssoc(); - cpDst->next = gDst->task[f]->cpAsc_dstHead; - gDst->task[f]->cpAsc_dstHead = cpDst; - } - cpDst->graphPartner = gSrc; - cpDst->l_con.ndcpy = 0; - cpDst->l_con.firingRuleCnt = 0; - cpDst->l_con.dcpyCnt = 0; - for(int i=0; il_con.ndcpy++; - } - cpDst->l_con.dcpy = new LocalCopyDescriptor[cpDst->l_con.ndcpy]; - int dcnt = 0; - - //if(gDst->graphID > 25) - //std::cout<< "Inside parallel Generating Local copy recive at tid " << tid << " f " << f << " gID " << gDst->graphID <graphID ==27 && f == 633) - //std::cout<< "tid " << tid << " f " << f << " gID " << gDst->graphID << " numReciv " << nloc_cpAsc << " ndcpy " << cpDst->l_con.ndcpy <graphID == 4 && (tag.dstIndex == 60 || tag.dstIndex == 59)) - //std::cout<< "dcpy tid " << tid << " f " << f << " i " << i << " dcnt " << dcnt << " ns "<l_con.dcpy[dcnt].ns = mfSrc.localindex(tag.srcIndex); - cpDst->l_con.dcpy[dcnt].nd = mfDst.localindex(tag.dstIndex); - cpDst->l_con.dcpy[dcnt].sbx = tag.sbox; - cpDst->l_con.dcpy[dcnt].dbx = tag.dbox; - - int psize = tag.dbox.numPts() * mfSrc.nComp(); //---------------------------------------------------------------???????????????? 
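firingRuleCnt, initialized to zero here, is the dataflow trigger for a task: it is incremented as local copies or remote receives become available and decremented as they are consumed. A hedged sketch of the readiness test this implies, assuming a task fires once each of its ndcpy + nrcv inputs has a queued package (the exact threshold is not spelled out in this excerpt):

// Hedged sketch of the firing rule implied by firingRuleCnt above: a task
// becomes runnable once every local copy and remote receive it consumes
// has at least one completed package queued.
struct Connections {
    int firingRuleCnt = 0; // bumped as inputs arrive, reduced on consumption
    int ndcpy = 0;         // local destination copies feeding this task
    int nrcv  = 0;         // remote receives feeding this task
    bool ready() const { return firingRuleCnt >= ndcpy + nrcv; }
};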
- cpDst->l_con.dcpy[dcnt].sz = psize; - - if(!gDst->isDepGraph) - { - for(int p=0; pdatabuf.local();//(static_cast >(tmpPkg->databuf)).local(); - for(int j=0; jdatabuf)[j] = 0; -#endif - cpDst->l_con.dcpy[dcnt].pQueue.enqueue(tmpPkg); - } - - for(int p=0; pl_con.dcpy[dcnt].recycleQueue.enqueue(cpDst->l_con.dcpy[dcnt].pQueue.dequeue()); - - } - dcnt++; - } - } - - RegionGraph* depGraph = gDst->srcLinkGraph; - for(int df=0; df < gDst->task[f]->depTaskIDs.size(); df++) - { - int dfi = gDst->task[f]->depTaskIDs[df]; - FabCopyAssoc *cpdDst = depGraph->task[dfi]->cpAsc_dstHead; - for(int i=0; il_con.ndcpy ; i++) - { - for(int p=0; pl_con.dcpy[i].sz; - Package *tmpPkg = new Package(psize); -#ifdef PERILLA_USE_UPCXX - void* local_ptr= tmpPkg->databuf.local();//(static_cast >(tmpPkg->databuf)).local(); - for(int j=0; jdatabuf)[j] = 0; -#endif - cpdDst->l_con.dcpy[i].pQueue.enqueue(tmpPkg); - } - for(int p=0; pl_con.dcpy[i].recycleQueue.enqueue(cpdDst->l_con.dcpy[i].pQueue.dequeue()); - } - } - - if(np > 1) - { - cpDst->r_con.nrcv = 0; - cpDst->r_con.remotePullDone = false; - cpDst->r_con.firingRuleCnt = 0; - for(int i=0; idstIndex) - cpDst->r_con.nrcv++; - } - } // for(ir_con.rcv = new RemoteCommDescriptor[cpDst->r_con.nrcv]; - dcnt = 0; - for(int i=0; idstIndex) - if(mfDst.IndexArray()[f] == it->dstIndex) - { - cpDst->r_con.rcv[dcnt].nd = it->dstIndex; - cpDst->r_con.rcv[dcnt].ns = it->srcIndex; - cpDst->r_con.rcv[dcnt].lnd = mfDst.localindex(it->dstIndex); - cpDst->r_con.rcv[dcnt].lns = mfSrc.localindex(it->srcIndex); - cpDst->r_con.rcv[dcnt].sbx = it->sbox; - cpDst->r_con.rcv[dcnt].dbx = it->dbox; - int psize = it->dbox.numPts() * mfDst.nComp(); //---------------------------------------------------------------???????????????? - cpDst->r_con.rcv[dcnt].sz = psize; - - if(!gDst->isDepGraph) - { - for(int p=0; pdatabuf.local();//(static_cast >(tmpPkg->databuf)).local(); - for(int j=0; jdatabuf)[j] = 0; -#endif - cpDst->r_con.rcv[dcnt].pQueue.enqueue(tmpPkg); - } - for(int p=0; pr_con.rcv[dcnt].recycleQueue.enqueue(cpDst->r_con.rcv[dcnt].pQueue.dequeue()); - } - - dcnt++; - } - } - }// for(isrcLinkGraph; - for(int df=0; df < gDst->task[f]->depTaskIDs.size(); df++) - { - int dfi = gDst->task[f]->depTaskIDs[df]; - FabCopyAssoc *cpdDst = depGraph->task[dfi]->cpAsc_dstHead; - for(int i=0; ir_con.nrcv ; i++) - { - for(int p=0; pr_con.rcv[i].sz; - Package *tmpPkg = new Package(psize); -#ifdef PERILLA_USE_UPCXX - void* local_ptr= tmpPkg->databuf.local();//(static_cast >(tmpPkg->databuf)).local(); - for(int j=0; jdatabuf)[j] = 0; -#endif - cpdDst->r_con.rcv[i].pQueue.enqueue(tmpPkg); - } - for(int p=0; pr_con.rcv[i].recycleQueue.enqueue(cpdDst->r_con.rcv[i].pQueue.dequeue()); - } - } - } // if(np > 1) - }// if(fg==tg) - -//#pragma omp barrier - if(np > 1) - { - //if(WorkerThread::perilla_isMasterWorkerThread() && tg==0) -// if(tid==0) - { - - // std::cout<< "Inside parallel Generating Remote Recive tg 0 at tid " << tid << " f " << f << " gID " << gDst->graphID <rCopyMapHead->map[f]->r_con.nrcv = 0; - gDst->rCopyMapHead->map[f]->r_con.firingRuleCnt = 0; - for(int i=0; idstIndex) - if(mfDst.IndexArray()[f] == it->dstIndex) - gDst->rCopyMapHead->map[f]->r_con.nrcv++; - } - } - gDst->rCopyMapHead->map[f]->r_con.rcv = new RemoteCommDescriptor[gDst->rCopyMapHead->map[f]->r_con.nrcv]; - int dcnt = 0; - for(int i=0; idstIndex) - if(mfDst.IndexArray()[f] == it->dstIndex) - { - - // if(myProc==54 && gDst->graphID == 25 && f == 10) - // std::cout <<"myP " <dstIndex << " ns "<< it->srcIndex << " f " << f << " sgID "<< 
gSrc->graphID <<" tg "<rCopyMapHead->map[f]->r_con.rcv[dcnt].nd = it->dstIndex; - gDst->rCopyMapHead->map[f]->r_con.rcv[dcnt].ns = it->srcIndex; - gDst->rCopyMapHead->map[f]->r_con.rcv[dcnt].lnd = mfDst.localindex(it->dstIndex); - gDst->rCopyMapHead->map[f]->r_con.rcv[dcnt].lns = mfSrc.localindex(it->srcIndex); - gDst->rCopyMapHead->map[f]->r_con.rcv[dcnt].r_grids = (gDst->numFabs > gSrc->numFabs ? gDst->numFabs : gSrc->numFabs); - gDst->rCopyMapHead->map[f]->r_con.rcv[dcnt].sbx = it->sbox; - gDst->rCopyMapHead->map[f]->r_con.rcv[dcnt].dbx = it->dbox; - - int psize = it->dbox.numPts() * mfDst.nComp(); //---------------------------------------------------------------???????????????? - - gDst->rCopyMapHead->map[f]->r_con.rcv[dcnt].sz = psize; - gDst->rCopyMapHead->map[f]->r_con.rcv[dcnt].pr = recv_pr[i]; - - BL_ASSERT(gDst->rCopyMapHead->map[f]->r_con.rcv[dcnt].lnd == f); - - if(Perilla::genTags) - { - try{ - std::map::iterator itr = tagMap[recv_pr[i]][gDst->graphID-1][it->dstIndex][it->srcIndex].find(psize); - if( itr != tagMap[recv_pr[i]][gDst->graphID-1][it->dstIndex][it->srcIndex].end()) - { - //gDst->rCopyMapHead->map[f]->r_con.rcv[dcnt].lnd = itr->second; - } - else - { - tagMap[recv_pr[i]][gDst->graphID-1][it->dstIndex][it->srcIndex][psize] = Perilla::uTags++; - //gDst->rCopyMapHead->map[f]->r_con.rcv[dcnt].lnd = Perilla::uTags++; - std::map::iterator itr2 = pTagCnt[recv_pr[i]].find(gDst->graphID-1); - if(itr2 != pTagCnt[recv_pr[i]].end()) - pTagCnt[recv_pr[i]][gDst->graphID-1] = pTagCnt[recv_pr[i]][gDst->graphID-1] + 1; - else - pTagCnt[recv_pr[i]][gDst->graphID-1] = 1; - } - } - catch(std::exception& e) - { - std::cout <<"Inside tagGeneration gID "<< gDst->graphID <<" "<< e.what() << '\n'; - } - } - //tagMap[recv_pr[i]][gDst->graphID][it->dstIndex][it->srcIndex] = pTagCnt[recv_pr[i]]; - - - for(int p=0; pdatabuf[j] = 0; - gDst->rCopyMapHead->map[f]->r_con.rcv[dcnt].pQueue.enqueue(tmpPkg); - } - for(int p=0; prCopyMapHead->map[f]->r_con.rcv[dcnt].recycleQueue.enqueue(gDst->rCopyMapHead->map[f]->r_con.rcv[dcnt].pQueue.dequeue()); - dcnt++; - } - } - } // for(i 1) - //} //if(fg==tg) - } // for(fgraphID > 25) - //std::cout<< "Inside parallel Generating Send partners at tid " << tid << " f " << f << " gID " << gDst->graphID <task[f]->cpAsc_srcHead->l_con.nscpy; i++) - { - int lnd = gSrc->task[f]->cpAsc_srcHead->l_con.scpy[i].nd; - for(int j=0; jtask[ lnd ]->cpAsc_dstHead->l_con.ndcpy; j++) - if(gSrc->task[f]->cpAsc_srcHead->l_con.scpy[i].dbx == gDst->task[ lnd ]->cpAsc_dstHead->l_con.dcpy[j].dbx) - gSrc->task[f]->cpAsc_srcHead->l_con.scpy[i].dPartner = j; - } - } - } // for(fgraphID > 25) - //std::cout<< "Inside parallel Generating Recive partners at tid " << tid << " f " << f << " gID " << gDst->graphID <task[f]->cpAsc_dstHead->l_con.ndcpy; i++) - { - int lns = gDst->task[f]->cpAsc_dstHead->l_con.dcpy[i].ns; - for(int j=0; jtask[ lns ]->cpAsc_srcHead->l_con.nscpy; j++) - if(gDst->task[f]->cpAsc_dstHead->l_con.dcpy[i].dbx == gSrc->task[ lns ]->cpAsc_srcHead->l_con.scpy[j].dbx) - gDst->task[f]->cpAsc_dstHead->l_con.dcpy[i].sPartner = j; - } - } - } // for(fgraphID <<" "<< e.what() << '\n'; -} - - -//std::cout<< "All done safely at gID " << gDst->graphID <assocMF; - //MultiFab* mfSrc = srcGraph->assocMF; - if(nc<1) cout <<"MULTIFAB_COPY_C: nc must be >= 1"<< endl; - if(mfDst->nComp() < (dstcomp-1)) cout <<"MULTIFAB_COPY_C: nc too large for dst multifab"<< endl; - //if(mfSrc->nComp() < (srccomp-1)) cout <<"MULTIFAB_COPY_C: nc too large for src multifab"<< endl; - - if(true)//if(!(*mfDst == 
*mfSrc)
- {
-     if(ng > mfDst->nGrow()) cout <<"MULTIFAB_COPY_C: ng > 0 not supported in parallel copy"<< endl;
-     //if(ngsrc > mfSrc->nGrow()) cout <<"MULTIFAB_COPY_C: ngsrc > msrc%ng"<< endl;
-     FabCopyAssoc* cpDst = destGraph->task[f]->cpAsc_dstHead;
-     while(cpDst != 0)
-     {
-         if(cpDst->graphPartner == srcGraph)
-             break;
-         cpDst = cpDst->next;
-     }
-     if(cpDst == 0) cout <<"Metadata for across grid copy not found"<< endl;
-     //destGraph->worker[tg]->barr->sync(perilla::NUM_THREADS_PER_TEAM-1);
-     if(singleT)
-     {
-         pthread_mutex_lock(&(cpDst->l_con.dLock));
-         for(int i=0; i<cpDst->l_con.ndcpy; i++)
-         {
-             Package* rcvPackage = cpDst->l_con.dcpy[i].pQueue.getFront(true); // corrected from recycleQ to pQ
-             mfDst->m_fabs_v[f]->copyFromMem(cpDst->l_con.dcpy[i].dbx,dstcomp,nc,rcvPackage->databuf);
-         }
-         for(int i=0; i<cpDst->l_con.ndcpy; i++)
-             cpDst->l_con.dcpy[i].recycleQueue.enqueue(cpDst->l_con.dcpy[i].pQueue.dequeue()); // corrected from pQ to recycleQ and from recycleQ to pQ
-         cpDst->l_con.firingRuleCnt = cpDst->l_con.firingRuleCnt - cpDst->l_con.ndcpy;
-         pthread_mutex_unlock(&(cpDst->l_con.dLock));
-     }
-     else
-     {
-         if(ntid==0)
-             pthread_mutex_lock(&(cpDst->l_con.dLock));
-         destGraph->worker[tg]->barr->sync(perilla::NUM_THREADS_PER_TEAM-1);
-
-         for(int i=0; i<cpDst->l_con.ndcpy; i++)
-             if((i%(perilla::NUM_THREADS_PER_TEAM-1)) == ntid)
-             {
-                 Package* rcvPackage = cpDst->l_con.dcpy[i].pQueue.getFront(true); // corrected from recycleQ to pQ
-                 mfDst->m_fabs_v[f]->copyFromMem(cpDst->l_con.dcpy[i].dbx,dstcomp,nc,rcvPackage->databuf);
-             }
-         destGraph->worker[tg]->barr->sync(perilla::NUM_THREADS_PER_TEAM-1);
-
-         if(ntid == 0)
-         {
-             for(int i=0; i<cpDst->l_con.ndcpy; i++)
-                 cpDst->l_con.dcpy[i].recycleQueue.enqueue(cpDst->l_con.dcpy[i].pQueue.dequeue()); // corrected from pQ to recycleQ and from recycleQ to pQ
-             cpDst->l_con.firingRuleCnt = cpDst->l_con.firingRuleCnt - cpDst->l_con.ndcpy;
-             pthread_mutex_unlock(&(cpDst->l_con.dLock));
-         }
-         destGraph->worker[tg]->barr->sync(perilla::NUM_THREADS_PER_TEAM-1);
-     }
-
-     int np = ParallelDescriptor::NProcs();
-     if(np == 1)
-         return;
-
-     if(singleT)
-     {
-         //pthread_mutex_lock(&(destGraph->rCopyMapHead->map[f]->r_con.rcvLock));
-         pthread_mutex_lock(&(cpDst->r_con.rcvLock));
-         for(int i=0; i<cpDst->r_con.nrcv; i++)
-         {
-             ///*
-             Package* rcvPackage = cpDst->r_con.rcv[i].pQueue.dequeue(true); // corrected from recycleQ to pQ
-             mfDst->m_fabs_v[f]->copyFromMem(cpDst->r_con.rcv[i].dbx,dstcomp,nc,rcvPackage->databuf);
-             rcvPackage->completed = false;
-             rcvPackage->served = false;
-             rcvPackage->request = MPI_REQUEST_NULL;
-             cpDst->r_con.rcv[i].recycleQueue.enqueue(rcvPackage, true); // corrected from pQ to recycleQ
-
-             /*
-             Package *rcvMetaPackage = destGraph->rCopyMapHead->map[f]->r_con.rcv[i].pQueue.dequeue(true);
-             rcvMetaPackage->completed = false;
-             rcvMetaPackage->served = false;
-             rcvMetaPackage->request = MPI_REQUEST_NULL;
-             destGraph->rCopyMapHead->map[f]->r_con.rcv[i].recycleQueue.enqueue(rcvMetaPackage, true);
-             */
-             //Package* rcvPackage = cpDst->r_con.rcv[i].pQueue.getFront(true); // corrected from recycleQ to pQ
-             //mfDst->m_fabs_v[f]->copyFromMem(cpDst->r_con.rcv[i].dbx,dstcomp,nc,rcvPackage->databuf);
-         }
-         cpDst->r_con.firingRuleCnt = cpDst->r_con.firingRuleCnt - cpDst->r_con.nrcv;
-
-         cpDst->r_con.remotePullDone = true;
-         ///*
-         for(int i=0; i<cpDst->r_con.nrcv; i++)
-             if(cpDst->r_con.rcv[i].pQueue.queueSize(true) >= 1)
-                 if(cpDst->r_con.rcv[i].pQueue.getFront(true)->checkRequest())
-                     cpDst->r_con.firingRuleCnt++;
-         //*/
-         pthread_mutex_unlock(&(cpDst->r_con.rcvLock));
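The singleT path above drains every remote receive under one lock on the calling thread. When a full worker team executes this pull instead (the else branch that follows), iterations are dealt round-robin by worker-thread id and fenced with team barriers so that thread 0 alone takes locks and republishes queues. A sketch of that work-sharing shape, with the worker count as an assumed stand-in constant:

// Hedged sketch of the team work-sharing pattern used in the non-singleT
// branches: iteration i belongs to worker thread ntid exactly when
// i % NUM_WORKERS == ntid; barriers fence the lock and publish phases.
const int NUM_WORKERS = 7; // stand-in for perilla::NUM_THREADS_PER_TEAM-1

void team_copy(int ntid, int ncpy /*, barrier and queues elided */)
{
    // barrier(); thread 0 takes the connection lock before this point
    for (int i = 0; i < ncpy; ++i)
        if (i % NUM_WORKERS == ntid)
        {
            /* pack or unpack copy i on this worker */
        }
    // barrier(); then thread 0 republishes packages and releases the lock
}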
//pthread_mutex_unlock(&(destGraph->rCopyMapHead->map[f]->r_con.rcvLock)); - } - else - { - if(ntid==0) - { - //pthread_mutex_lock(&(destGraph->rCopyMapHead->map[f]->r_con.rcvLock)); - pthread_mutex_lock(&(cpDst->r_con.rcvLock)); - } - destGraph->worker[tg]->barr->sync(perilla::NUM_THREADS_PER_TEAM-1); - - for(int i=0; ir_con.nrcv; i++) - if((i%(perilla::NUM_THREADS_PER_TEAM-1)) == ntid) - { - ///* - - Package* rcvPackage = cpDst->r_con.rcv[i].pQueue.dequeue(true); // corrected from recycleQ to pQ - mfDst->m_fabs_v[f]->copyFromMem(cpDst->r_con.rcv[i].dbx,dstcomp,nc,rcvPackage->databuf); - rcvPackage->completed = false; - rcvPackage->served = false; - rcvPackage->request = MPI_REQUEST_NULL; - cpDst->r_con.rcv[i].recycleQueue.enqueue(rcvPackage, true); // corrected from pQ to recycleQ - - /*Package *rcvMetaPackage = destGraph->rCopyMapHead->map[f]->r_con.rcv[i].pQueue.dequeue(true); - rcvMetaPackage->completed = false; - rcvMetaPackage->served = false; - rcvMetaPackage->request = MPI_REQUEST_NULL; - destGraph->rCopyMapHead->map[f]->r_con.rcv[i].recycleQueue.enqueue(rcvMetaPackage, true); - */ - - //Package* rcvPackage = cpDst->r_con.rcv[i].pQueue.getFront(true); // corrected from recycleQ to pQ - // mfDst->m_fabs_v[f]->copyFromMem(cpDst->r_con.rcv[i].dbx,dstcomp,nc,rcvPackage->databuf); - - } - destGraph->worker[tg]->barr->sync(perilla::NUM_THREADS_PER_TEAM-1); - if(ntid==0) - { - cpDst->r_con.firingRuleCnt = cpDst->r_con.firingRuleCnt - cpDst->r_con.nrcv; - - cpDst->r_con.remotePullDone = true; - ///* - for(int i=0; ir_con.nrcv; i++) - if(cpDst->r_con.rcv[i].pQueue.queueSize() >= 1) - if(cpDst->r_con.rcv[i].pQueue.getFront()->checkRequest()) - cpDst->r_con.firingRuleCnt++; - //*/ - pthread_mutex_unlock(&(cpDst->r_con.rcvLock)); - //pthread_mutex_unlock(&(destGraph->rCopyMapHead->map[f]->r_con.rcvLock)); - } - destGraph->worker[tg]->barr->sync(perilla::NUM_THREADS_PER_TEAM-1); - } - } // if(!(*mfDst == *mfSrc)) - -} // multifabCopyPull -#endif - - - - -#if 0 -void Perilla::multifabCopyPull(RegionGraph* destGraph, RegionGraph* srcGraph, amrex::MultiFab* mfDst, amrex::MultiFab* mfSrc, int f, int dstcomp, int srccomp, int nc, int ng, int ngsrc, bool singleT) -{ - //double start_time_wtime = omp_get_wtime(); - - if(nc<1) cout <<"MULTIFAB_COPY_C: nc must be >= 1"<< endl; - if(mfDst->nComp() < (dstcomp-1)) cout <<"MULTIFAB_COPY_C: nc too large for dst multifab"<< endl; - - //mTeams = false; - - //if(np==1) - //multifabCopyPull_1Team(destGraph,srcGraph,mfDst,mfSrc,f,dstcomp,srccomp,nc,ng,ngsrc,singleT); - /*else if(mTeams) - { - if(WorkerThread::isLocPPTID(tid)) - multifabCopyLocPull(destGraph,srcGraph,mfDst,mfSrc,f,tid,dstcomp,srccomp,nc,ng,ngsrc); - else - multifabCopyRmtPull(destGraph,srcGraph,mfDst,mfSrc,f,tid,dstcomp,srccomp,nc,ng,ngsrc); - } - else - multifabCopyPull_1Team(destGraph,srcGraph,mfDst,mfSrc,f,tid,dstcomp,srccomp,nc,ng,ngsrc,singleT); -*/ - - if(!singleT) - srcGraph->worker[perilla::wid()]->barr->sync(perilla::NUM_THREADS_PER_TEAM-perilla::NUM_COMM_THREADS); - - //double end_time_wtime = omp_get_wtime(); - //if(ntid==0) - //Perilla::getPPPTimeSplit[3] += end_time_wtime - start_time_wtime; -} -#endif - - -#if 0 -Array send_cctc; -Array send_pr; -Array recv_cctc; -Array recv_pr; - - -void Perilla::multifabExtractCopyAssoc(RegionGraph* gDst, RegionGraph* gSrc, const MultiFab& mfDst, const MultiFab& mfSrc, int nc, int ng, int ngSrc, const Periodicity& period) -{ -#if 1 - int myProc = ParallelDescriptor::MyProc(); - int np = ParallelDescriptor::NProcs(); - try{ - if(true)//if(!(*mfSrc 
== *mfDst)) - { -#ifdef USE_PERILLA_PTHREADS -// if(perilla::isMasterThread()) -#endif - { - if(ng > mfDst.nGrow()) cout <<"MULTIFAB_COPY_C: ng > mfDst.nGrow not supported in parallel copy"<< endl; - if(ngSrc > mfSrc.nGrow()) cout <<"MULTIFAB_COPY_C: ngSrc > mfSrc.nGrow"<< endl; - if(ngSrc > 0) - { - // To be implemented - //do i = 1, nboxes(msrc%la) - // call push_back(bl, grow(box_nodalize(get_box(msrc%la,i),msrc%nodal),lngsrc)) - //end do - //call build(batmp, bl, sort = .false.) - //call destroy(bl) - //call build(lasrctmp, batmp, boxarray_bbox(batmp), explicit_mapping = get_proc(msrc%la)) - //call destroy(batmp) - //call build(msrctmp, lasrctmp, nc = lnc, ng = 0) - //pmfsrc => msrctmp - assert(false); - } - if(np > 1) - { - if(gSrc->sCopyMapHead == 0) - gSrc->sCopyMapHead = new CopyMap(); - else - { - CopyMap *tmpCopyMap = new CopyMap(); - tmpCopyMap->next = gSrc->sCopyMapHead; - gSrc->sCopyMapHead = tmpCopyMap; - } - if(gDst->rCopyMapHead == 0) - gDst->rCopyMapHead = new CopyMap(); - else - { - CopyMap *tmpCopyMap = new CopyMap(); - tmpCopyMap->next = gDst->rCopyMapHead; - gDst->rCopyMapHead = tmpCopyMap; - } - //gSrc->sCopyMapHead->map.reserve(mfSrc.size()); - //gDst->rCopyMapHead->map.reserve(mfDst.size()); - gSrc->sCopyMapHead->alloc_CopyMap(mfSrc); - gDst->rCopyMapHead->alloc_CopyMap(mfDst); - } - - //if(gSrc->numTasks != mfSrc.IndexArray().size()) - // std::cout<< "before " <numTasks << " now " <graphID << std::endl; - - gSrc->numFabs = mfSrc.size(); - gDst->numFabs = mfDst.size(); - gSrc->numTasks = mfSrc.IndexArray().size(); - gDst->numTasks = mfDst.IndexArray().size(); - } -#ifdef USE_PERILLA_PTHREADS -// perilla::syncAllThreads(); -#endif - const FabArrayBase::CPC *TheCPC= &mfDst.getCPC(ng, mfSrc, ngSrc, period);; - - int nfabsSrc = mfSrc.IndexArray().size(); - int nfabsDst = mfDst.IndexArray().size(); - - const int nloc_cpAsc = TheCPC->m_LocTags->size(); - const int nsnds_cpAsc = TheCPC->m_SndTags->size(); - const int nrcvs_cpAsc = TheCPC->m_RcvTags->size(); -#ifdef USE_PERILLA_PTHREADS -// perilla::syncAllThreads(); -#endif - - if(np > 1){ -#ifdef USE_PERILLA_PTHREADS -// if(perilla::isMasterThread()) -#endif - { - send_cctc.reserve(nsnds_cpAsc); - - for (FabArrayBase::MapOfCopyComTagContainers::const_iterator m_it = TheCPC->m_SndTags->begin(), - m_End = TheCPC->m_SndTags->end(); - m_it != m_End; - ++m_it) - { - if(m_it->first != myProc) // Not destined to me. 
- { - send_pr.push_back(m_it->first); - send_cctc.push_back(&(m_it->second)); - } - } - - recv_cctc.reserve(nrcvs_cpAsc); - - for (FabArrayBase::MapOfCopyComTagContainers::const_iterator m_it = TheCPC->m_RcvTags->begin(), - m_End = TheCPC->m_RcvTags->end(); - m_it != m_End; - ++m_it) - { - if(m_it->first != myProc) // I am not the source for this receipt - { - recv_pr.push_back(m_it->first); - recv_cctc.push_back(&(m_it->second)); - } - } - } - } -#ifdef USE_PERILLA_PTHREADS -// perilla::syncAllThreads(); -#endif - -//#ifndef USE_PERILLA_PTHREADS - #pragma omp parallel shared(gSrc, gDst, mfSrc, mfDst, nfabsSrc, nfabsDst) -//#endif - { -#ifdef _OPENMP - int tid = omp_get_thread_num();//perilla::tid();//omp_get_thread_num(); -#else - int tid=0; -#endif - int tg = tid/perilla::NUM_THREADS_PER_TEAM;//perilla::wid();//WorkerThread::perilla_wid(); - int nt= tid%perilla::NUM_THREADS_PER_TEAM; - int fg; - //std::cout<<"thread "<< tid<<"group "<graphID << " numTask " << gDst->numTasks << " numFabs " << gDst->numFabs <graphID > 25) - //std::cout<< "Inside parallel Generating Send at tid " << tid << " f " << f << " gID " << gDst->graphID <task[f]->cpAsc_srcHead == 0) - { - gSrc->task[f]->cpAsc_srcHead = new FabCopyAssoc(); - cpSrc = gSrc->task[f]->cpAsc_srcHead; - } - else - { - cpSrc = new FabCopyAssoc(); - cpSrc->next = gSrc->task[f]->cpAsc_srcHead; - gSrc->task[f]->cpAsc_srcHead = cpSrc; - } - - cpSrc->graphPartner = gDst; - cpSrc->l_con.nscpy = 0; - for(int i=0; im_LocTags)[i]; - //if(f == tag.srcIndex) - if(mfSrc.IndexArray()[f] == tag.srcIndex) - cpSrc->l_con.nscpy++; - } - cpSrc->l_con.scpy = new LocalCopyDescriptor[cpSrc->l_con.nscpy]; - - //if(gDst->graphID == 4 && tag.dstIndex == 60 ) - //std::cout<< "Inside parallel Generating Local Copy send at tid " << tid << " f " << f << " gID " << gDst->graphID <<" num local connections"<< nloc_cpAsc << std::endl; - - for(int i=0; im_LocTags)[i]; - //if(f == tag.srcIndex) - if(mfSrc.IndexArray()[f] == tag->srcIndex) - { - cpSrc->l_con.scpy[scnt].ns = mfSrc.localindex(tag->srcIndex); - cpSrc->l_con.scpy[scnt].nd = mfDst.localindex(tag->dstIndex); - cpSrc->l_con.scpy[scnt].sbx = tag->sbox; - cpSrc->l_con.scpy[scnt].dbx = tag->dbox; - int psize = tag->sbox.numPts() * mfSrc.nComp(); //---------------------------------------------------------------???????????????? - //std::cout<< " gSrc ID "<< gSrc->graphID << " f "<databuf[j] = 0; - cpSrc->l_con.scpy[scnt].pQueue.enqueue(tmpPkg); - } - for(int p=0; pl_con.scpy[scnt].recycleQueue.enqueue(cpSrc->l_con.scpy[scnt].pQueue.dequeue()); - scnt++; - } - } - - if(np > 1) - { - cpSrc->r_con.nsnd = 0; - cpSrc->r_con.remotePushReady = false; - cpSrc->r_con.firingRuleCnt = 0; - for(int i=0; isrcIndex) - cpSrc->r_con.nsnd++; - } - } // for(ir_con.snd = new RemoteCommDescriptor[cpSrc->r_con.nsnd]; - scnt = 0; - for(int i=0; isrcIndex) - { - cpSrc->r_con.snd[scnt].ns = it->srcIndex; - cpSrc->r_con.snd[scnt].nd = it->dstIndex; - cpSrc->r_con.snd[scnt].lns = mfSrc.localindex(it->srcIndex); - cpSrc->r_con.snd[scnt].lnd = mfDst.localindex(it->dstIndex); - cpSrc->r_con.snd[scnt].sbx = it->sbox; - cpSrc->r_con.snd[scnt].dbx = it->dbox; - int psize = it->sbox.numPts() * mfSrc.nComp(); //---------------------------------------------------------------???????????????? 
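In this variant the flat OpenMP thread id is decomposed into a team id and a rank within the team, and each FAB is handled by a single team (the fg==tg test). A small sketch of that decomposition; the f % nTeams ownership rule is an assumption consistent with the loop structure, not a quote of the original:

// Hedged sketch of the id decomposition used above: a flat thread id
// splits into (team, rank-in-team), and fab f is assumed to be owned
// by team f % nTeams.
struct ThreadCoords { int team, rank; };

ThreadCoords coords(int tid, int threadsPerTeam)
{
    return { tid / threadsPerTeam, tid % threadsPerTeam };
}

bool owns_fab(int team, int nTeams, int f) { return f % nTeams == team; }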
- - for(int p=0; pdatabuf[j] = 0; - cpSrc->r_con.snd[scnt].pQueue.enqueue(tmpPkg); - } - for(int p=0; pr_con.snd[scnt].recycleQueue.enqueue(cpSrc->r_con.snd[scnt].pQueue.dequeue()); - scnt++; - } - } - } // for(i 1) - } // if(fg==tg) - - //perilla::syncAllThreads(); - #pragma omp barrier - if(np > 1) - { - //if(WorkerThread::perilla_isMasterWorkerThread() && tg==0) - if(tid==0) - { - - // std::cout<< "Inside parallel Generating Remote Send tg 0 at tid " << tid << " f " << f << " gID " << gDst->graphID <sCopyMapHead->map[f]->r_con.nsnd = 0; - gSrc->sCopyMapHead->map[f]->r_con.firingRuleCnt = 0; - for(int i=0; isrcIndex) - gSrc->sCopyMapHead->map[f]->r_con.nsnd++; - } - } // for(isCopyMapHead->map[f]->r_con.snd = new RemoteCommDescriptor[gSrc->sCopyMapHead->map[f]->r_con.nsnd]; - int scnt = 0; - for(int i=0; isrcIndex) - { - - //if(gDst->graphID == 31 && (it->dstIndex == 519)) - //std::cout <<"myP " <dstIndex << " ns "<< it->srcIndex << " f " << f << " i "<< scnt << " tg " <sCopyMapHead->map[f]->r_con.snd[scnt].ns = it->srcIndex; - gSrc->sCopyMapHead->map[f]->r_con.snd[scnt].nd = it->dstIndex; - gSrc->sCopyMapHead->map[f]->r_con.snd[scnt].r_gid = gDst->graphID-1; - gSrc->sCopyMapHead->map[f]->r_con.snd[scnt].r_grids = (gDst->numFabs > gSrc->numFabs ? gDst->numFabs : gSrc->numFabs); - gSrc->sCopyMapHead->map[f]->r_con.snd[scnt].lns = mfSrc.localindex(it->srcIndex); - gSrc->sCopyMapHead->map[f]->r_con.snd[scnt].lnd = mfDst.localindex(it->dstIndex); - gSrc->sCopyMapHead->map[f]->r_con.snd[scnt].sbx = it->sbox; - gSrc->sCopyMapHead->map[f]->r_con.snd[scnt].dbx = it->dbox; - - int psize = it->sbox.numPts() * mfSrc.nComp(); //---------------------------------------------------------------???????????????? - - gSrc->sCopyMapHead->map[f]->r_con.snd[scnt].sz = psize; - gSrc->sCopyMapHead->map[f]->r_con.snd[scnt].pr = send_pr[i]; - - for(int p=0; pdatabuf[j] = 0; - gSrc->sCopyMapHead->map[f]->r_con.snd[scnt].pQueue.enqueue(tmpPkg); - } - for(int p=0; psCopyMapHead->map[f]->r_con.snd[scnt].recycleQueue.enqueue(gSrc->sCopyMapHead->map[f]->r_con.snd[scnt].pQueue.dequeue()); - scnt++; - } - } - } // for(i 1) - } // for(fgraphID > 25) - //std::cout<< "Inside parallel Generating Recive at tid " << tid << " f " << f << " gID " << gDst->graphID <task[f]->cpAsc_dstHead == 0) - { - gDst->task[f]->cpAsc_dstHead = new FabCopyAssoc(); - cpDst = gDst->task[f]->cpAsc_dstHead; - } - else - { - cpDst = new FabCopyAssoc(); - cpDst->next = gDst->task[f]->cpAsc_dstHead; - gDst->task[f]->cpAsc_dstHead = cpDst; - } - cpDst->graphPartner = gSrc; - cpDst->l_con.ndcpy = 0; - cpDst->l_con.firingRuleCnt = 0; - cpDst->l_con.dcpyCnt = 0; - for(int i=0; im_LocTags)[i]; - //if(f == tag.dstIndex) - if(mfDst.IndexArray()[f] == tag->dstIndex) - cpDst->l_con.ndcpy++; - } - cpDst->l_con.dcpy = new LocalCopyDescriptor[cpDst->l_con.ndcpy]; - int dcnt = 0; - - //if(gDst->graphID > 25) - //std::cout<< "Inside parallel Generating Local copy recive at tid " << tid << " f " << f << " gID " << gDst->graphID <graphID ==27 && f == 633) - //std::cout<< "tid " << tid << " f " << f << " gID " << gDst->graphID << " numReciv " << nloc_cpAsc << " ndcpy " << cpDst->l_con.ndcpy <m_LocTags)[i]; - //if(f == tag->dstIndex) - if(mfDst.IndexArray()[f] == tag->dstIndex) - { - - //if(gDst->graphID == 4 && (tag->dstIndex == 60 || tag->dstIndex == 59)) - //std::cout<< "dcpy tid " << tid << " f " << f << " i " << i << " dcnt " << dcnt << " ns "<srcIndex << " nd "<dstIndex << " lo " << tag->dbox.smallEnd() << " hi " << tag->dbox.bigEnd() <l_con.dcpy[dcnt].ns = 
mfSrc.localindex(tag->srcIndex); - cpDst->l_con.dcpy[dcnt].nd = mfDst.localindex(tag->dstIndex); - cpDst->l_con.dcpy[dcnt].sbx = tag->sbox; - cpDst->l_con.dcpy[dcnt].dbx = tag->dbox; - - // if(gDst->graphID > 25 && f == 633) - //std::cout<< " Generating Package tid " << tid << " i " << i <dbox.numPts() * mfSrc.nComp(); //---------------------------------------------------------------???????????????? - cpDst->l_con.dcpy[dcnt].sz = psize; - - if(!gDst->isDepGraph) - { - for(int p=0; pdatabuf[j] = 0; - cpDst->l_con.dcpy[dcnt].pQueue.enqueue(tmpPkg); - } - - // if(gDst->graphID > 25 && f == 633) - //std::cout<< " Generating now in reQ Package tid " << tid << " i " << i <l_con.dcpy[dcnt].recycleQueue.enqueue(cpDst->l_con.dcpy[dcnt].pQueue.dequeue()); - - //if(gDst->graphID > 25 && f == 633) - // std::cout<< " Generated Package tid " << tid << " i " << i <graphID > 25 && f > 630) - //std::cout<< "Safe now tid " << tid << " f " << f << " gID " << gDst->graphID << " numReciv " << nloc_cpAsc <srcLinkGraph; - for(int df=0; df < gDst->task[f]->depTaskIDs.size(); df++) - { - int dfi = gDst->task[f]->depTaskIDs[df]; - FabCopyAssoc *cpdDst = depGraph->task[dfi]->cpAsc_dstHead; - for(int i=0; il_con.ndcpy ; i++) - { - for(int p=0; pl_con.dcpy[i].sz; - Package *tmpPkg = new Package(psize); - for(int j=0; jdatabuf[j] = 0; - cpdDst->l_con.dcpy[i].pQueue.enqueue(tmpPkg); - } - for(int p=0; pl_con.dcpy[i].recycleQueue.enqueue(cpdDst->l_con.dcpy[i].pQueue.dequeue()); - } - } - - if(np > 1) - { - cpDst->r_con.nrcv = 0; - cpDst->r_con.remotePullDone = false; - cpDst->r_con.firingRuleCnt = 0; - for(int i=0; idstIndex) - cpDst->r_con.nrcv++; - } - } // for(ir_con.rcv = new RemoteCommDescriptor[cpDst->r_con.nrcv]; - dcnt = 0; - for(int i=0; idstIndex) - if(mfDst.IndexArray()[f] == it->dstIndex) - { - cpDst->r_con.rcv[dcnt].nd = it->dstIndex; - cpDst->r_con.rcv[dcnt].ns = it->srcIndex; - cpDst->r_con.rcv[dcnt].lnd = mfDst.localindex(it->dstIndex); - cpDst->r_con.rcv[dcnt].lns = mfSrc.localindex(it->srcIndex); - cpDst->r_con.rcv[dcnt].sbx = it->sbox; - cpDst->r_con.rcv[dcnt].dbx = it->dbox; - int psize = it->dbox.numPts() * mfDst.nComp(); //---------------------------------------------------------------???????????????? 
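When gDst feeds a dependent graph (srcLinkGraph and depTaskIDs), the package queues of the dependent tasks' copy associations are pre-filled here as well, so the downstream graph also avoids allocation at runtime. A hedged sketch of that pre-fill pass, with simplified stand-in types; the real code routes Package objects through pQueue and recycleQueue as in the surrounding loops:

#include <queue>
#include <vector>

// Hedged sketch of the dependent-graph pre-fill above: for every dependent
// connection, push freshly zeroed buffers through pending and immediately
// park them in recycle; the buffers live for the graph's lifetime.
struct Conn { std::queue<std::vector<double>*> pending, recycle; int sz = 0; };

void prefill(std::vector<Conn*>& depConns, int npkgs)
{
    for (Conn* c : depConns) {
        for (int p = 0; p < npkgs; ++p)
            c->pending.push(new std::vector<double>(c->sz, 0.0));
        for (int p = 0; p < npkgs; ++p) {         // mirrors pQueue.dequeue()
            c->recycle.push(c->pending.front());  //   -> recycleQueue.enqueue()
            c->pending.pop();
        }
    }
}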
- cpDst->r_con.rcv[dcnt].sz = psize; - - if(!gDst->isDepGraph) - { - for(int p=0; pdatabuf[j] = 0; - cpDst->r_con.rcv[dcnt].pQueue.enqueue(tmpPkg); - } - for(int p=0; pr_con.rcv[dcnt].recycleQueue.enqueue(cpDst->r_con.rcv[dcnt].pQueue.dequeue()); - } - - dcnt++; - } - } - }// for(isrcLinkGraph; - for(int df=0; df < gDst->task[f]->depTaskIDs.size(); df++) - { - int dfi = gDst->task[f]->depTaskIDs[df]; - FabCopyAssoc *cpdDst = depGraph->task[dfi]->cpAsc_dstHead; - for(int i=0; ir_con.nrcv ; i++) - { - for(int p=0; pr_con.rcv[i].sz; - Package *tmpPkg = new Package(psize); - for(int j=0; jdatabuf[j] = 0; - cpdDst->r_con.rcv[i].pQueue.enqueue(tmpPkg); - } - for(int p=0; pr_con.rcv[i].recycleQueue.enqueue(cpdDst->r_con.rcv[i].pQueue.dequeue()); - } - } - - - } // if(np > 1) - }// if(fg==tg) - - //perilla::syncAllThreads(); - #pragma omp barrier - - if(np > 1) - { - //if(WorkerThread::perilla_isMasterWorkerThread() && tg==0) - if(tid==0) - { - // std::cout<< "Inside parallel Generating Remote Recive tg 0 at tid " << tid << " f " << f << " gID " << gDst->graphID <rCopyMapHead->map[f]->r_con.nrcv = 0; - gDst->rCopyMapHead->map[f]->r_con.firingRuleCnt = 0; - for(int i=0; idstIndex) - if(mfDst.IndexArray()[f] == it->dstIndex) - gDst->rCopyMapHead->map[f]->r_con.nrcv++; - } - } - gDst->rCopyMapHead->map[f]->r_con.rcv = new RemoteCommDescriptor[gDst->rCopyMapHead->map[f]->r_con.nrcv]; - int dcnt = 0; - for(int i=0; idstIndex) - if(mfDst.IndexArray()[f] == it->dstIndex) - { - - // if(myProc==54 && gDst->graphID == 25 && f == 10) - // std::cout <<"myP " <dstIndex << " ns "<< it->srcIndex << " f " << f << " sgID "<< gSrc->graphID <<" tg "<rCopyMapHead->map[f]->r_con.rcv[dcnt].nd = it->dstIndex; - gDst->rCopyMapHead->map[f]->r_con.rcv[dcnt].ns = it->srcIndex; - gDst->rCopyMapHead->map[f]->r_con.rcv[dcnt].lnd = mfDst.localindex(it->dstIndex); - gDst->rCopyMapHead->map[f]->r_con.rcv[dcnt].lns = mfSrc.localindex(it->srcIndex); - gDst->rCopyMapHead->map[f]->r_con.rcv[dcnt].r_grids = (gDst->numFabs > gSrc->numFabs ? gDst->numFabs : gSrc->numFabs); - gDst->rCopyMapHead->map[f]->r_con.rcv[dcnt].sbx = it->sbox; - gDst->rCopyMapHead->map[f]->r_con.rcv[dcnt].dbx = it->dbox; - - int psize = it->dbox.numPts() * mfDst.nComp(); //---------------------------------------------------------------???????????????? 
- - gDst->rCopyMapHead->map[f]->r_con.rcv[dcnt].sz = psize; - gDst->rCopyMapHead->map[f]->r_con.rcv[dcnt].pr = recv_pr[i]; - - BL_ASSERT(gDst->rCopyMapHead->map[f]->r_con.rcv[dcnt].lnd == f); - - if(Perilla::genTags) - { - try{ - std::map::iterator itr = tagMap[recv_pr[i]][gDst->graphID-1][it->dstIndex][it->srcIndex].find(psize); - if( itr != tagMap[recv_pr[i]][gDst->graphID-1][it->dstIndex][it->srcIndex].end()) - { - //gDst->rCopyMapHead->map[f]->r_con.rcv[dcnt].lnd = itr->second; - } - else - { - tagMap[recv_pr[i]][gDst->graphID-1][it->dstIndex][it->srcIndex][psize] = Perilla::uTags++; - //gDst->rCopyMapHead->map[f]->r_con.rcv[dcnt].lnd = Perilla::uTags++; - std::map::iterator itr2 = pTagCnt[recv_pr[i]].find(gDst->graphID-1); - if(itr2 != pTagCnt[recv_pr[i]].end()) - pTagCnt[recv_pr[i]][gDst->graphID-1] = pTagCnt[recv_pr[i]][gDst->graphID-1] + 1; - else - pTagCnt[recv_pr[i]][gDst->graphID-1] = 1; - } - } - catch(std::exception& e) - { - std::cout <<"Inside tagGeneration gID "<< gDst->graphID <<" "<< e.what() << '\n'; - } - } - //tagMap[recv_pr[i]][gDst->graphID][it->dstIndex][it->srcIndex] = pTagCnt[recv_pr[i]]; - - - for(int p=0; pdatabuf[j] = 0; - gDst->rCopyMapHead->map[f]->r_con.rcv[dcnt].pQueue.enqueue(tmpPkg); - } - for(int p=0; prCopyMapHead->map[f]->r_con.rcv[dcnt].recycleQueue.enqueue(gDst->rCopyMapHead->map[f]->r_con.rcv[dcnt].pQueue.dequeue()); - dcnt++; - } - } - } // for(i 1) - //} //if(fg==tg) - } // for(fgraphID > 25) - //std::cout<< "Inside parallel Generating Send partners at tid " << tid << " f " << f << " gID " << gDst->graphID <task[f]->cpAsc_srcHead->l_con.nscpy; i++) - { - int lnd = gSrc->task[f]->cpAsc_srcHead->l_con.scpy[i].nd; - for(int j=0; jtask[ lnd ]->cpAsc_dstHead->l_con.ndcpy; j++) - if(gSrc->task[f]->cpAsc_srcHead->l_con.scpy[i].dbx == gDst->task[ lnd ]->cpAsc_dstHead->l_con.dcpy[j].dbx) - gSrc->task[f]->cpAsc_srcHead->l_con.scpy[i].dPartner = j; - } - } - } // for(fgraphID > 25) - //std::cout<< "Inside parallel Generating Recive partners at tid " << tid << " f " << f << " gID " << gDst->graphID <task[f]->cpAsc_dstHead->l_con.ndcpy; i++) - { - int lns = gDst->task[f]->cpAsc_dstHead->l_con.dcpy[i].ns; - for(int j=0; jtask[ lns ]->cpAsc_srcHead->l_con.nscpy; j++) - if(gDst->task[f]->cpAsc_dstHead->l_con.dcpy[i].dbx == gSrc->task[ lns ]->cpAsc_srcHead->l_con.scpy[j].dbx) - gDst->task[f]->cpAsc_dstHead->l_con.dcpy[i].sPartner = j; - } - } - } // for(fgraphID <<" "<< e.what() << '\n'; -} - - -//std::cout<< "All done safely at gID " << gDst->graphID <assocMF; - // MultiFab* mfSrc = srcGraph->assocMF; - if(nc<1) cout <<"MULTIFAB_COPY_C: nc must be >= 1"<< endl; - if(mfDst->nComp() < (dstcomp-1)) cout <<"MULTIFAB_COPY_C: nc too large for dst multifab"<< endl; - if(mfSrc->nComp() < (srccomp-1)) cout <<"MULTIFAB_COPY_C: nc too large for src multifab"<< endl; - - if(true)//if(!(*mfDst == *mfSrc)) - { - if(ng > mfDst->nGrow()) cout <<"MULTIFAB_COPY_C: ng > 0 not supported in parallel copy"<< endl; - if(ngsrc > mfSrc->nGrow()) cout <<"MULTIFAB_COPY_C: ngsrc > msrc%ng"<< endl; - FabCopyAssoc* cpSrc = srcGraph->task[f]->cpAsc_srcHead; - - //if(srcGraph->graphID==18 && f ==316 && ntid == 0) - //std::cout << "srgG chk see " << srcGraph << " " <graphPartner == destGraph) - break; - cpSrc = cpSrc->next; - } - if(cpSrc == 0) cout <<"Metadata for across grid copy not found"<< endl; - - if(singleT) - { - pthread_mutex_lock(&(cpSrc->l_con.sLock)); - for(int i=0; il_con.nscpy; i++) - { - Package* sndPackage = cpSrc->l_con.scpy[i].recycleQueue.getFront(true); - 
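// A minimal sketch (not part of the original Perilla sources) of the tag
// generation above: each (receiving process, graph, dstIndex, srcIndex,
// message size) tuple gets a unique MPI tag, minted from a global counter on
// first lookup. Sender and receiver walk the same map, so the Asend/Arecv
// tags agree. The nested std::map chain is flattened into a tuple key here.
#include <iostream>
#include <map>
#include <tuple>

using TagKey = std::tuple<int,int,int,int,int>; // pr, graph, dst, src, size

static std::map<TagKey,int> tagMap;
static int uTags = 1000;  // seed is illustrative; Perilla::uTags in the real code

int getOrMintTag(int pr, int gid, int dst, int src, int sz) {
    TagKey key{pr, gid, dst, src, sz};
    auto itr = tagMap.find(key);
    if (itr != tagMap.end()) return itr->second;  // tag already assigned
    return tagMap[key] = uTags++;                 // mint a fresh tag
}

int main() {
    int a = getOrMintTag(3, 24, 10, 7, 512);
    int b = getOrMintTag(3, 24, 10, 7, 512);      // same tuple -> same tag
    std::cout << a << " " << b << "\n";
    return 0;
}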
mfSrc->m_fabs_v[f]->copyToMem(cpSrc->l_con.scpy[i].sbx,srccomp,nc,sndPackage->databuf); - } - for(int i=0;il_con.nscpy; i++) - cpSrc->l_con.scpy[i].pQueue.enqueue(cpSrc->l_con.scpy[i].recycleQueue.dequeue(true),true); - pthread_mutex_unlock(&(cpSrc->l_con.sLock)); - } - else - { - if(ntid == 0) - pthread_mutex_lock(&(cpSrc->l_con.sLock)); - srcGraph->worker[tg]->barr->sync(perilla::NUM_THREADS_PER_TEAM-1); - for(int i=0; il_con.nscpy; i++) - if((i%(perilla::NUM_THREADS_PER_TEAM-1)) == ntid) - { - Package* sndPackage = cpSrc->l_con.scpy[i].recycleQueue.getFront(true); - mfSrc->m_fabs_v[f]->copyToMem(cpSrc->l_con.scpy[i].sbx,srccomp,nc,sndPackage->databuf); - } - srcGraph->worker[tg]->barr->sync(perilla::NUM_THREADS_PER_TEAM-1); - if(ntid==0) - { - for(int i=0;il_con.nscpy; i++) - cpSrc->l_con.scpy[i].pQueue.enqueue(cpSrc->l_con.scpy[i].recycleQueue.dequeue(true),true); - pthread_mutex_unlock(&(cpSrc->l_con.sLock)); - } - srcGraph->worker[tg]->barr->sync(perilla::NUM_THREADS_PER_TEAM-1); - } - - int np = ParallelDescriptor::NProcs(); - if(np == 1) - return; - - //if(myProc==26 && srcGraph->graphID==18 && ntid == 0) - //std::cout << "Notw its sgID 18,"<< f <<" turn lets see " << cpSrc->r_con.nsnd <graphID==18 && ntid == 0) - //std::cout << "Notw its sgID 18,"<< f <<" turn lets see " << cpSrc->r_con.nsnd <graphID==18 && f ==316) - //BL_ASSERT(cpSrc->r_con.nsnd == 177); - - if(singleT) - { - pthread_mutex_lock(&(cpSrc->r_con.sndLock)); - for(int i=0; ir_con.nsnd; i++) - { - - Package* sndPackage = cpSrc->r_con.snd[i].recycleQueue.dequeue(true); - mfSrc->m_fabs_v[f]->copyToMem(cpSrc->r_con.snd[i].sbx,srccomp,nc,sndPackage->databuf); - cpSrc->r_con.snd[i].pQueue.enqueue(sndPackage,true); - } - - pthread_mutex_unlock(&(cpSrc->r_con.sndLock)); - - cpSrc->r_con.remotePushReady = true; - ///* - pthread_mutex_lock(&(srcGraph->sCopyMapHead->map[f]->r_con.sndLock)); - for(int i=0; ir_con.nsnd; i++) - srcGraph->sCopyMapHead->map[f]->r_con.snd[i].pQueue.enqueue(srcGraph->sCopyMapHead->map[f]->r_con.snd[i].recycleQueue.dequeue(true),true); - pthread_mutex_unlock(&(srcGraph->sCopyMapHead->map[f]->r_con.sndLock)); - } - else - { - if(ntid == 0) - pthread_mutex_lock(&(cpSrc->r_con.sndLock)); - srcGraph->worker[tg]->barr->sync(perilla::NUM_THREADS_PER_TEAM-1); - - for(int i=0; ir_con.nsnd; i++) - if((i%(perilla::NUM_THREADS_PER_TEAM-1)) == ntid) - { - - // if(myProc==4 && srcGraph->graphID==2 && (f ==0 || f ==2)) - //std::cout << " Pushing 2 316 164"<r_con.snd[i].recycleQueue.dequeue(true); - mfSrc->m_fabs_v[f]->copyToMem(cpSrc->r_con.snd[i].sbx,srccomp,nc,sndPackage->databuf); - cpSrc->r_con.snd[i].pQueue.enqueue(sndPackage,true); - - } - - srcGraph->worker[tg]->barr->sync(perilla::NUM_THREADS_PER_TEAM-1); - if(ntid==0) - { - pthread_mutex_unlock(&(cpSrc->r_con.sndLock)); - - cpSrc->r_con.remotePushReady = true; - ///* - pthread_mutex_lock(&(srcGraph->sCopyMapHead->map[f]->r_con.sndLock)); - for(int i=0; ir_con.nsnd; i++) - srcGraph->sCopyMapHead->map[f]->r_con.snd[i].pQueue.enqueue(srcGraph->sCopyMapHead->map[f]->r_con.snd[i].recycleQueue.dequeue(true),true); - pthread_mutex_unlock(&(srcGraph->sCopyMapHead->map[f]->r_con.sndLock)); - //*/ - } - srcGraph->worker[tg]->barr->sync(perilla::NUM_THREADS_PER_TEAM-1); - } - } // if(!(*mfDst == *mfSrc)) -} // multifabCopyPushAsync -#endif - - -#if 0 -void Perilla::multifabCopyPull(RegionGraph* destGraph, RegionGraph* srcGraph, MultiFab* mfDst, MultiFab* mfSrc, int f, int dstcomp, int srccomp, int nc, int ng, int ngsrc, bool singleT) -{ - int myProc = 
ParallelDescriptor::MyProc(); - - int ntid = WorkerThread::perilla_wtid(); - int tg = WorkerThread::perilla_wid(); - //MultiFab* mfDst = destGraph->assocMF; - //MultiFab* mfSrc = srcGraph->assocMF; - if(nc<1) cout <<"MULTIFAB_COPY_C: nc must be >= 1"<< endl; - if(mfDst->nComp() < (dstcomp-1)) cout <<"MULTIFAB_COPY_C: nc too large for dst multifab"<< endl; - //if(mfSrc->nComp() < (srccomp-1)) cout <<"MULTIFAB_COPY_C: nc too large for src multifab"<< endl; - - if(true)//if(!(*mfDst == *mfSrc)) - { - if(ng > mfDst->nGrow()) cout <<"MULTIFAB_COPY_C: ng > 0 not supported in parallel copy"<< endl; - //if(ngsrc > mfSrc->nGrow()) cout <<"MULTIFAB_COPY_C: ngsrc > msrc%ng"<< endl; - FabCopyAssoc* cpDst = destGraph->task[f]->cpAsc_dstHead; - while(cpDst != 0) - { - if(cpDst->graphPartner == srcGraph) - break; - cpDst = cpDst->next; - } - if(cpDst == 0) cout <<"Metadata for across grid copy not found"<< endl; - //destGraph->worker[tg]->barr->sync(perilla::NUM_THREADS_PER_TEAM-1); - - if(singleT) - { - pthread_mutex_lock(&(cpDst->l_con.dLock)); - for(int i=0; il_con.ndcpy; i++) - { - Package* rcvPackage = cpDst->l_con.dcpy[i].pQueue.getFront(true); // corrected from recycleQ to pQ - mfDst->m_fabs_v[f]->copyFromMem(cpDst->l_con.dcpy[i].dbx,dstcomp,nc,rcvPackage->databuf); - } - for(int i=0; il_con.ndcpy; i++) - cpDst->l_con.dcpy[i].recycleQueue.enqueue(cpDst->l_con.dcpy[i].pQueue.dequeue(true),true); // corrected from pQ to recycleQ and from recycleQ to pQ - cpDst->l_con.firingRuleCnt = cpDst->l_con.firingRuleCnt - cpDst->l_con.ndcpy; - pthread_mutex_unlock(&(cpDst->l_con.dLock)); - } - else - { - if(ntid==0) - pthread_mutex_lock(&(cpDst->l_con.dLock)); - destGraph->worker[tg]->barr->sync(perilla::NUM_THREADS_PER_TEAM-1); - - for(int i=0; il_con.ndcpy; i++) - if((i%(perilla::NUM_THREADS_PER_TEAM-1)) == ntid) - { - Package* rcvPackage = cpDst->l_con.dcpy[i].pQueue.getFront(true); // corrected from recycleQ to pQ - mfDst->m_fabs_v[f]->copyFromMem(cpDst->l_con.dcpy[i].dbx,dstcomp,nc,rcvPackage->databuf); - } - destGraph->worker[tg]->barr->sync(perilla::NUM_THREADS_PER_TEAM-1); - - if(ntid == 0) - { - for(int i=0; il_con.ndcpy; i++) - cpDst->l_con.dcpy[i].recycleQueue.enqueue(cpDst->l_con.dcpy[i].pQueue.dequeue(true),true); // corrected from pQ to recycleQ and from recycleQ to pQ - cpDst->l_con.firingRuleCnt = cpDst->l_con.firingRuleCnt - cpDst->l_con.ndcpy; - pthread_mutex_unlock(&(cpDst->l_con.dLock)); - } - destGraph->worker[tg]->barr->sync(perilla::NUM_THREADS_PER_TEAM-1); - } - - int np = ParallelDescriptor::NProcs(); - if(np == 1) - return; - - if(singleT) - { - pthread_mutex_lock(&(destGraph->rCopyMapHead->map[f]->r_con.rcvLock)); - pthread_mutex_lock(&(cpDst->r_con.rcvLock)); - for(int i=0; ir_con.nrcv; i++) - { - ///* - Package *rcvMetaPackage = destGraph->rCopyMapHead->map[f]->r_con.rcv[i].pQueue.dequeue(true); - rcvMetaPackage->completed = false; - rcvMetaPackage->served = false; - rcvMetaPackage->request = MPI_REQUEST_NULL; - destGraph->rCopyMapHead->map[f]->r_con.rcv[i].recycleQueue.enqueue(rcvMetaPackage,true); - - Package* rcvPackage = cpDst->r_con.rcv[i].pQueue.dequeue(true); // corrected from recycleQ to pQ - mfDst->m_fabs_v[f]->copyFromMem(cpDst->r_con.rcv[i].dbx,dstcomp,nc,rcvPackage->databuf); - rcvPackage->completed = false; - cpDst->r_con.rcv[i].recycleQueue.enqueue(rcvPackage,true); // corrected from pQ to recycleQ - //*/ - - //Package* rcvPackage = cpDst->r_con.rcv[i].pQueue.getFront(true); // corrected from recycleQ to pQ - 
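// A minimal sketch (not part of the original Perilla sources) of the static
// work partitioning used in both the push and pull paths above: copy i is
// handled by team thread ntid exactly when i % nWorkers == ntid, so the
// per-fab copy list is split across the team with no dynamic work queue,
// while thread 0 does the lock/queue bookkeeping around two barriers.
#include <iostream>

int main() {
    const int nCopies  = 10;  // cpDst->l_con.ndcpy in the real code
    const int nWorkers = 3;   // perilla::NUM_THREADS_PER_TEAM-1 in the real code
    for (int ntid = 0; ntid < nWorkers; ++ntid) {
        std::cout << "thread " << ntid << " copies:";
        for (int i = 0; i < nCopies; ++i)
            if (i % nWorkers == ntid)   // ownership test used above
                std::cout << " " << i;
        std::cout << "\n";
    }
    return 0;
}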
//mfDst->m_fabs_v[f]->copyFromMem(cpDst->r_con.rcv[i].dbx,dstcomp,nc,rcvPackage->databuf); - } - cpDst->r_con.firingRuleCnt = cpDst->r_con.firingRuleCnt - cpDst->r_con.nrcv; - - cpDst->r_con.remotePullDone = true; - ///* - for(int i=0; ir_con.nrcv; i++) - if(cpDst->r_con.rcv[i].pQueue.queueSize(true) >= 1) - if(cpDst->r_con.rcv[i].pQueue.getFront(true)->checkRequest()) - cpDst->r_con.firingRuleCnt++; - //*/ - pthread_mutex_unlock(&(cpDst->r_con.rcvLock)); - pthread_mutex_unlock(&(destGraph->rCopyMapHead->map[f]->r_con.rcvLock)); - - } - else - { - if(ntid==0) - { - pthread_mutex_lock(&(destGraph->rCopyMapHead->map[f]->r_con.rcvLock)); - pthread_mutex_lock(&(cpDst->r_con.rcvLock)); - } - destGraph->worker[tg]->barr->sync(perilla::NUM_THREADS_PER_TEAM-1); - - for(int i=0; ir_con.nrcv; i++) - if((i%(perilla::NUM_THREADS_PER_TEAM-1)) == ntid) - { - ///* - Package *rcvMetaPackage = destGraph->rCopyMapHead->map[f]->r_con.rcv[i].pQueue.dequeue(true); - rcvMetaPackage->completed = false; - rcvMetaPackage->served = false; - rcvMetaPackage->request = MPI_REQUEST_NULL; - destGraph->rCopyMapHead->map[f]->r_con.rcv[i].recycleQueue.enqueue(rcvMetaPackage,true); - - Package* rcvPackage = cpDst->r_con.rcv[i].pQueue.dequeue(true); // corrected from recycleQ to pQ - mfDst->m_fabs_v[f]->copyFromMem(cpDst->r_con.rcv[i].dbx,dstcomp,nc,rcvPackage->databuf); - rcvPackage->completed = false; - cpDst->r_con.rcv[i].recycleQueue.enqueue(rcvPackage,true); // corrected from pQ to recycleQ - //*/ - - //Package* rcvPackage = cpDst->r_con.rcv[i].pQueue.getFront(true); // corrected from recycleQ to pQ - //mfDst->m_fabs_v[f]->copyFromMem(cpDst->r_con.rcv[i].dbx,dstcomp,nc,rcvPackage->databuf); - - } - destGraph->worker[tg]->barr->sync(perilla::NUM_THREADS_PER_TEAM-1); - - if(ntid==0) - { - cpDst->r_con.firingRuleCnt = cpDst->r_con.firingRuleCnt - cpDst->r_con.nrcv; - - cpDst->r_con.remotePullDone = true; - ///* - for(int i=0; ir_con.nrcv; i++) - if(cpDst->r_con.rcv[i].pQueue.queueSize(true) >= 1) - if(cpDst->r_con.rcv[i].pQueue.getFront(true)->checkRequest()) - cpDst->r_con.firingRuleCnt++; - //*/ - pthread_mutex_unlock(&(cpDst->r_con.rcvLock)); - pthread_mutex_unlock(&(destGraph->rCopyMapHead->map[f]->r_con.rcvLock)); - } - destGraph->worker[tg]->barr->sync(perilla::NUM_THREADS_PER_TEAM-1); - } - } // if(!(*mfDst == *mfSrc)) - -} // multifabCopyPull -#endif - - - -#if 0 -void Perilla::serviceRemoteGridCopyRequests(std::vector graphArray, int g, int nGraphs, int tg) -{ - bool nextsReq, nextrReq; - int np = ParallelDescriptor::NProcs(); - int myProc = ParallelDescriptor::MyProc(); - int numfabs = graphArray[g]->numTasks; - int graphID = graphArray[g]->graphID; - - for(int f=0; ftask[f]->cpAsc_dstHead; - while(cpDst != 0) - { - //if(pthread_mutex_trylock(&(graphArray[g]->rCopyMapHead->map[f]->r_con.rcvLock)) != 0) - { - //pthread_mutex_lock(&(graphArray[g]->rCopyMapHead->map[f]->r_con.rcvLock)); - //if(pthread_mutex_trylock(&(cpDst->r_con.rcvLock)) != 0) - { - for(int i=0; ir_con.nrcv; i++) - { - //if(graphArray[g]->rCopyMapHead->map[f]->r_con.rcv[i].pQueue.queueSize(true) == 0) //!no message has been received or all received messages have been claimed - if(cpDst->r_con.rcv[i].pQueue.queueSize(true)==0) - { - nextrReq = true; - } - else - { - //Package *rearPackage = graphArray[g]->rCopyMapHead->map[f]->r_con.rcv[i].pQueue.getRear(true);//!CHECK THIS POINT LATER - Package *rearPackage = cpDst->r_con.rcv[i].pQueue.getRear(true);//!CHECK THIS POINT LATER - // Also check the recycle queue because when rear is completed it may 
cause unlimited recv posts - //if(rearPackage->completed && graphArray[g]->rCopyMapHead->map[f]->r_con.rcv[i].recycleQueue.queueSize(true) > 1) //!latest receive request has been completed - if(rearPackage->completed && cpDst->r_con.rcv[i].pQueue.queueSize(true) == 1) //!latest receive request has been completed - { - nextrReq = true; - } - else //!expected message is still on the way - nextrReq = false; - } - if(nextrReq) //!take a message from recycle pool and post a receive - { - //pthread_mutex_lock(&(graphArray[g]->rCopyMapHead->map[f]->r_con.rcvLock)); - pthread_mutex_lock(&(cpDst->r_con.rcvLock)); - //!create a package to keep track of receive requests - //Package *rMetaPackage = graphArray[g]->rCopyMapHead->map[f]->r_con.rcv[i].recycleQueue.dequeue(true); - //!extract a package from the recycle pool at the destination NUMA node to buffer incoming data - int ns = graphArray[g]->rCopyMapHead->map[f]->r_con.rcv[i].ns; - int nd = graphArray[g]->rCopyMapHead->map[f]->r_con.rcv[i].nd; - int lnd = graphArray[g]->rCopyMapHead->map[f]->r_con.rcv[i].lnd; - int r_grids = graphArray[g]->rCopyMapHead->map[f]->r_con.rcv[i].r_grids; - Package *rPackage = cpDst->r_con.rcv[i].recycleQueue.dequeue(true); - //int tag = tagGen(ns, nd, graphID-1, np*r_grids, nGraphs); - //int tag = Perilla::myTagMap[graphID-1][nd][ns]; - //int tag = graphArray[g]->rCopyMapHead->map[f]->r_con.rcv[i].lnd; - int tag = tagMap[graphArray[g]->rCopyMapHead->map[f]->r_con.rcv[i].pr][g][nd][ns][graphArray[g]->rCopyMapHead->map[f]->r_con.rcv[i].sz]; - - rPackage->request = MPI_REQUEST_NULL; - rPackage->completed=false; - cpDst->r_con.rcv[i].pQueue.enqueue(rPackage, true); //!this is not done yet - //graphArray[g]->rCopyMapHead->map[f]->r_con.rcv[i].pQueue.enqueue(rMetaPackage, true); //!this is not done yet - rPackage->request = ParallelDescriptor::Arecv(rPackage->databuf, - graphArray[g]->rCopyMapHead->map[f]->r_con.rcv[i].sz, - graphArray[g]->rCopyMapHead->map[f]->r_con.rcv[i].pr, tag).req(); // tag == SeqNum in c++ ver - pthread_mutex_unlock(&(cpDst->r_con.rcvLock)); - //pthread_mutex_unlock(&(graphArray[g]->rCopyMapHead->map[f]->r_con.rcvLock)); - } - } // for (ir_con.nrcv) - } // if(ga locked) - //pthread_mutex_unlock(&(graphArray[g]->rCopyMapHead->map[f]->r_con.rcvLock)); - } // if(mf locked) - cpDst = cpDst->next; - } // while(cpDst != 0) - } // for(ftask[f]->cpAsc_srcHead; - while(cpSrc != 0) - { - for(int i=0; ir_con.nsnd; i++) - { - //if(graphArray[g]->sCopyMapHead->map[f]->r_con.snd[i].pQueue.queueSize(true) == 0) //!no message has been received or all received messages have been claimed - if(cpSrc->r_con.snd[i].pQueue.queueSize(true) == 0) - nextsReq = false; - else - nextsReq = true; - - if(nextsReq) //!take a message from recycle pool and post a receive - { - Package *sPackage = cpSrc->r_con.snd[i].pQueue.getFront(true); - if(!sPackage->served) - { - //Package *sMetaPackage = graphArray[g]->sCopyMapHead->map[f]->r_con.snd[i].pQueue.getFront(true); - sPackage->completed = false; - sPackage->served = true; - sPackage->request = MPI_REQUEST_NULL; - int ns = graphArray[g]->sCopyMapHead->map[f]->r_con.snd[i].ns; - int nd = graphArray[g]->sCopyMapHead->map[f]->r_con.snd[i].nd; - int r_gid = graphArray[g]->sCopyMapHead->map[f]->r_con.snd[i].r_gid; - int r_grids = graphArray[g]->sCopyMapHead->map[f]->r_con.snd[i].r_grids; - int tag = Perilla::myTagMap[r_gid][nd][ns][graphArray[g]->sCopyMapHead->map[f]->r_con.snd[i].sz]; - sPackage->request = ParallelDescriptor::Asend(sPackage->databuf, - 
graphArray[g]->sCopyMapHead->map[f]->r_con.snd[i].sz, - graphArray[g]->sCopyMapHead->map[f]->r_con.snd[i].pr, tag).req(); // tag == SeqNum in c++ ver - } - } - } // for (ir_con.nsnd) - cpSrc = cpSrc->next; - } // while(cpSrc != 0) - } // for(ftask[f]->cpAsc_dstHead; - while(cpDst != 0) - { - //if(pthread_mutex_trylock(&(cpDst->r_con.rcvLock)) != 0) - { - for(int i=0; ir_con.nrcv; i++) - { - //if(graphArray[g]->rCopyMapHead->map[f]->r_con.rcv[i].pQueue.queueSize(true) > 0) //!all messages before rear have completed - if(cpDst->r_con.rcv[i].pQueue.queueSize(true) > 0) //!all messages before rear have completed - { - //Package *rearPackage = graphArray[g]->rCopyMapHead->map[f]->r_con.rcv[i].pQueue.getRear(true); - Package *rearPackage = cpDst->r_con.rcv[i].pQueue.getRear(true); - if(rearPackage) - if(!rearPackage->completed) - { - pthread_mutex_lock(&(cpDst->r_con.rcvLock)); - bool flag = false; - int ret_flag=0; - MPI_Status status; - ParallelDescriptor::Test(rearPackage->request, ret_flag, status); - - flag = (ret_flag == 0) ? false : true;//parallel_test_one(rearPackage%ptr%request) -------??????? - if(flag) - { - rearPackage->completeRequest(); - cpDst->r_con.rcv[i].pQueue.getRear(true)->completeRequest(); - - //if(graphArray[g]->rCopyMapHead->map[f]->r_con.rcv[i].pQueue.queueSize(true) == 1) - if(cpDst->r_con.rcv[i].pQueue.queueSize(true) == 1) - { - cpDst->r_con.firingRuleCnt++; - } - } - pthread_mutex_unlock(&(cpDst->r_con.rcvLock)); - } - } // if(pQueue.queueSize(true) > 0) - } // for (ir_con.nrcv) - } // if(ga locked) - cpDst = cpDst->next; - } // while(cpDst != 0) - } // for(ftask[f]->cpAsc_srcHead; - while(cpSrc != 0) - { - for(int i=0; ir_con.nsnd; i++) - { - //if(graphArray[g]->sCopyMapHead->map[f]->r_con.snd[i].pQueue.queueSize(true) > 0) - if(cpSrc->r_con.snd[i].pQueue.queueSize(true) >0) - { - //Package *frontPackage = graphArray[g]->sCopyMapHead->map[f]->r_con.snd[i].pQueue.getFront(true); - Package *frontPackage = cpSrc->r_con.snd[i].pQueue.getFront(true); - if(frontPackage->served && !frontPackage->completed) //!latest receive request has NOT been completed - { - bool flag = false; - int ret_flag; - MPI_Status status; - ParallelDescriptor::Test(frontPackage->request, ret_flag, status); - flag = (ret_flag == 0) ? false : true;//parallel_test_one(frontPackage%ptr%request) -------??????? 
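// A minimal sketch (not part of the original Perilla sources) of the polling
// done by the service loops above: each outstanding request is checked with a
// nonblocking test (ParallelDescriptor::Test wraps MPI_Test), and a completed
// send's package is reset and returned to the recycle pool. A self-exchange
// on MPI_COMM_SELF stands in for the real cross-process traffic.
#include <mpi.h>
#include <vector>

// Poll one in-flight send; returns true once it has completed.
bool pollSend(MPI_Request& req) {
    int done = 0;
    MPI_Status status;
    MPI_Test(&req, &done, &status);   // nonblocking completion check
    return done != 0;
}

int main(int argc, char** argv) {
    MPI_Init(&argc, &argv);
    std::vector<double> sbuf(64, 1.0), rbuf(64, 0.0);
    MPI_Request sreq, rreq;
    MPI_Irecv(rbuf.data(), 64, MPI_DOUBLE, 0, /*tag*/7, MPI_COMM_SELF, &rreq);
    MPI_Isend(sbuf.data(), 64, MPI_DOUBLE, 0, /*tag*/7, MPI_COMM_SELF, &sreq);
    while (!pollSend(sreq)) { /* the runtime services other graphs here */ }
    MPI_Wait(&rreq, MPI_STATUS_IGNORE);
    // On completion the real code would recycle the package for reuse.
    MPI_Finalize();
    return 0;
}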
- if(flag) - { - - //pthread_mutex_lock(&(graphArray[g]->sCopyMapHead->map[f]->r_con.sndLock)); - pthread_mutex_lock(&(cpSrc->r_con.sndLock)); - frontPackage = cpSrc->r_con.snd[i].pQueue.dequeue(true); - frontPackage->completed = false; - frontPackage->served = false; - frontPackage->request = MPI_REQUEST_NULL; - cpSrc->r_con.snd[i].recycleQueue.enqueue(frontPackage, true); - pthread_mutex_unlock(&(cpSrc->r_con.sndLock)); - -/* - frontPackage = graphArray[g]->sCopyMapHead->map[f]->r_con.snd[i].pQueue.dequeue(true); - frontPackage->completed = false; - frontPackage->served = false; - frontPackage->request = MPI_REQUEST_NULL; - graphArray[g]->sCopyMapHead->map[f]->r_con.snd[i].recycleQueue.enqueue(frontPackage, true); -*/ - //pthread_mutex_unlock(&(graphArray[g]->sCopyMapHead->map[f]->r_con.sndLock)); - } - } - } // if(queueSize > 0) - } // for (ir_con.nsnd) - cpSrc = cpSrc->next; - } // while(cpSrc != 0) - } // for(f graphArray, int g, int nGraphs, int tg) -{ - int np = ParallelDescriptor::NProcs(); - int myProc = ParallelDescriptor::MyProc(); - int numfabs = graphArray[g]->numTasks; - //MultiFab* mf = graphArray[g]->assocMF; - int graphID = graphArray[g]->graphID; - - for(int f=0; ftask[f]->cpAsc_srcHead; - while(cpSrc != 0) - { - if(cpSrc->r_con.remotePushReady) - { - pthread_mutex_lock(&(graphArray[g]->sCopyMapHead->map[f]->r_con.sndLock)); - for(int i=0; ir_con.nsnd; i++) - { - graphArray[g]->sCopyMapHead->map[f]->r_con.snd[i].pQueue.enqueue(graphArray[g]->sCopyMapHead->map[f]->r_con.snd[i].recycleQueue.dequeue(true),true); - } - pthread_mutex_unlock(&(graphArray[g]->sCopyMapHead->map[f]->r_con.sndLock)); - cpSrc->r_con.remotePushReady = false; - }// if remotepushready - cpSrc = cpSrc->next; - } - }// ismyRegion - }//for ftask[f]->cpAsc_dstHead; - while(cpDst != 0) - { - if(pthread_mutex_trylock(&(graphArray[g]->rCopyMapHead->map[f]->r_con.rcvLock)) != 0) - { - if(pthread_mutex_trylock(&(cpDst->r_con.rcvLock)) != 0) - { - //if(f==1 && g==26 && myProc == 54) - //std::cout<<"Completing Push f " << f << " gID " << g+1 << " myP " << myProc << " PDone "<< cpDst->r_con.remotePullDone <r_con.remotePullDone) - { - for(int i=0; ir_con.nrcv; i++) - { - - Package *rcvMetaPackage = graphArray[g]->rCopyMapHead->map[f]->r_con.rcv[i].pQueue.dequeue(true); - rcvMetaPackage->completed = false; - rcvMetaPackage->served = false; - rcvMetaPackage->request = MPI_REQUEST_NULL; - graphArray[g]->rCopyMapHead->map[f]->r_con.rcv[i].recycleQueue.enqueue(rcvMetaPackage,true); - - Package* rcvPackage = cpDst->r_con.rcv[i].pQueue.dequeue(true); // corrected from recycleQ to pQ - rcvPackage->completed = false; - cpDst->r_con.rcv[i].recycleQueue.enqueue(rcvPackage,true); // corrected from pQ to recycleQ - - //cpDst->r_con.firingRuleCnt = cpDst->r_con.firingRuleCnt - 1; - - if(cpDst->r_con.rcv[i].pQueue.queueSize(true) >= 1) - if(cpDst->r_con.rcv[i].pQueue.getFront(true)->checkRequest()) - cpDst->r_con.firingRuleCnt++; - - - } // for (ir_con.nrcv) - - cpDst->r_con.remotePullDone = false; - - //if(f==1 && g==26 && myProc == 54) - // std::cout<<"Completed Push f " << f << " gID " << g+1 << " myP " << myProc << " PDone "<< cpDst->r_con.remotePullDone <r_con.rcvLock)); - } // if(ga locked) - pthread_mutex_unlock(&(graphArray[g]->rCopyMapHead->map[f]->r_con.rcvLock)); - } // if(mf locked) - cpDst = cpDst->next; - } // while(cpDst != 0) - /* - if(false) - for(int id=0; idtask[f]->depTaskIDs.size(); id++) - { - int df = graphArray[g]->task[f]->depTaskIDs[id]; - if(WorkerThread::isMyRegion(0,df)) - { - int lgID = 
graphArray[g]->srcLinkGraph->graphID-1; - - //if(f==1 && g==26 && myProc == 54) - //std::cout<<"Completing Dep Push f " << df << " gID " << lgID+1 << " myP " << myProc <task[df]->cpAsc_dstHead; - while(cpdDst != 0) - { - if(omp_test_lock(graphArray[lgID]->rCopyMapHead->map[df]->r_con.rcvLock) != 0) - { - if(omp_test_lock(cpdDst->r_con.rcvLock) != 0) - { - //if(f==1 && g==26 && myProc == 54) - //std::cout<<"Completing Push f " << f << " gID " << g+1 << " myP " << myProc << " PDone "<< cpdDst->r_con.remotePullDone <r_con.remotePullDone) - { - for(int i=0; ir_con.nrcv; i++) - { - - Package *rcvMetaPackage = graphArray[lgID]->rCopyMapHead->map[df]->r_con.rcv[i].pQueue.dequeue(true); - rcvMetaPackage->completed = false; - rcvMetaPackage->served = false; - rcvMetaPackage->request = MPI_REQUEST_NULL; - graphArray[lgID]->rCopyMapHead->map[df]->r_con.rcv[i].recycleQueue.enqueue(rcvMetaPackage,true); - - Package* rcvPackage = cpdDst->r_con.rcv[i].pQueue.dequeue(true); // corrected from recycleQ to pQ - rcvPackage->completed = false; - cpdDst->r_con.rcv[i].recycleQueue.enqueue(rcvPackage,true); // corrected from pQ to recycleQ - - //cpdDst->r_con.firingRuleCnt = cpdDst->r_con.firingRuleCnt - 1; - - if(cpdDst->r_con.rcv[i].pQueue.queueSize(true) >= 1) - if(cpdDst->r_con.rcv[i].pQueue.getFront(true)->checkRequest()) - cpdDst->r_con.firingRuleCnt++; - - - } // for (ir_con.nrcv) - - cpdDst->r_con.remotePullDone = false; - - //if(df==10 && lgID==24 && myProc == 54) - // std::cout<<"Completed Push f " << df << " gID " << lgID+1 << " myP " << myProc << " PDone "<< cpdDst->r_con.remotePullDone <r_con.rcvLock); - } // if(ga locked) - omp_unset_lock(graphArray[lgID]->rCopyMapHead->map[df]->r_con.rcvLock); - } // if(mf locked) - cpdDst = cpdDst->next; - } // while(cpdDst != 0) - - - } // if tg==0 region - - - } // for all dependents - */ - } - } // for(f -//#include -//#include -#include - -namespace amrex{ - - class AsyncFillPatchIterator; - - class RGIter - { - public: - int tid; - int ntid; - int tg; - int currentRegion; - int currentTile; - int totalItr; - int currentItr; - bool tiling; - bool implicit; - bool ppteams; - bool haveDepGraph; - RegionGraph* itrGraph; - RegionGraph* depGraph; - int boxGrow, index, scomp, ncomp, iteration; - double time; - double getFireableTime; - amrex::MultiFab *_dest; - - IndexType typ; - - Vector m_level_afpi; - Vector m_upper_level_afpi; - std::ofstream fout; - - public: - RGIter(RegionGraph* rg -#ifdef USE_PERILLA_ON_DEMAND - ,std::vector graphArray -#endif - , bool enableAllTasks=false); - RGIter(RegionGraph* rg -#ifdef USE_PERILLA_ON_DEMAND - ,std::vector graphArray -#endif - , RegionGraph* drg, bool isDep=true); - RGIter(amrex::AsyncFillPatchIterator* afpi, bool enableAllTasks=false); - RGIter(Vector afpi, Vector upper_afpi, - amrex::MultiFab& dest, int bG, double tm, int ind, int sc, int nc, int itr); - ~RGIter(); - - void init(); - void sync_workers(); - //! Increment iterator to the next tile we own. - void operator++ (); - //! Is the iterator valid, are more regions to iterate over? 
- bool isValid(); - int LocalIndex() const { return currentRegion; } - void exec(); - - amrex::Box tileBox(); - amrex::Box validBox() const; - amrex::Box tilebox(); - amrex::Box growntilebox(); - amrex::Box growntilebox(int ng); - amrex::Box nodaltilebox(int dir); - }; -} -#endif diff --git a/Src/AmrTask/rts_impls/runtime_common/RGIter.cpp b/Src/AmrTask/rts_impls/runtime_common/RGIter.cpp deleted file mode 100755 index 0a456199da8..00000000000 --- a/Src/AmrTask/rts_impls/runtime_common/RGIter.cpp +++ /dev/null @@ -1,639 +0,0 @@ -#include -#include -#include -#include -#include - -#include -#include -using namespace perilla; -#include - -#ifdef USE_PERILLA_ON_DEMAND - pthread_mutex_t teamFinLock=PTHREAD_MUTEX_INITIALIZER; -#endif - -namespace amrex{ - - RGIter::RGIter(RegionGraph* rg -#ifdef USE_PERILLA_ON_DEMAND - ,std::vector graphArray -#endif - , bool enableAllTasks - ): - itrGraph(rg), - implicit(false), - ppteams(true), - //typ(rg->typ), - haveDepGraph(false), - depGraph(NULL), - getFireableTime(0.) - { - tid = perilla::tid(); - tg = perilla::wid(); - ntid = perilla::wtid(); -#ifdef USE_PERILLA_ON_DEMAND - if(tid==0)Perilla::syncProcesses(); - Perilla::numTeamsFinished=0; - #pragma omp barrier - if(perilla::isCommunicationThread()) - { - while(true){ - Perilla::serviceMultipleGraphCommDynamic(graphArray,true,perilla::tid()); - if( Perilla::numTeamsFinished == perilla::NUM_THREAD_TEAMS) - { - /*perilla::syncWorkers(ntid); - if(tg==0){ - graphArray.clear(); - Perilla::numTeamsFinished=0; - } - perilla::syncWorkers(ntid);*/ - break; - } - } - }else{ -#endif - itrGraph->worker[tg]->l_barr->sync(perilla::NUM_THREADS_PER_TEAM-perilla::NUM_COMM_THREADS); - if(perilla::isMasterWorkerThread()) - itrGraph->Reset(); - itrGraph->worker[tg]->l_barr->sync(perilla::NUM_THREADS_PER_TEAM-perilla::NUM_COMM_THREADS); - if(enableAllTasks) - itrGraph->enableAllRegions(); - itrGraph->worker[tg]->l_barr->sync(perilla::NUM_THREADS_PER_TEAM-perilla::NUM_COMM_THREADS); - init(); -#ifdef USE_PERILLA_ON_DEMAND - } -#endif - } - - RGIter::RGIter(RegionGraph* rg -#ifdef USE_PERILLA_ON_DEMAND - ,std::vector graphArray -#endif - , RegionGraph* drg, bool isDep - ): - itrGraph(rg), - implicit(false), - ppteams(true), - //typ(rg->typ), - haveDepGraph(isDep), - depGraph(drg), - getFireableTime(0.) - { - tid = perilla::tid(); - tg = perilla::wid(); - ntid = perilla::wtid(); - -#ifdef USE_PERILLA_ON_DEMAND - if(tid==0)Perilla::syncProcesses(); - Perilla::numTeamsFinished=0; - #pragma omp barrier - if(perilla::isCommunicationThread()) - { - //Perilla::flattenGraphHierarchy(m_level_afpi[iteration-1]->m_amrlevel.parent->graphArray, graphArray); - while(true){ - Perilla::serviceMultipleGraphCommDynamic(graphArray,true,perilla::tid()); - if( Perilla::numTeamsFinished == perilla::NUM_THREAD_TEAMS) - { - perilla::syncWorkers(ntid); - if(tg==0){ - graphArray.clear(); - //Perilla::numTeamsFinished=0; - } - perilla::syncWorkers(ntid); - break; - } - } - }else{ -#endif - itrGraph->worker[tg]->barr->sync(perilla::NUM_THREADS_PER_TEAM-perilla::NUM_COMM_THREADS); - if(perilla::isMasterWorkerThread()) itrGraph->Reset(); - itrGraph->worker[tg]->barr->sync(perilla::NUM_THREADS_PER_TEAM-perilla::NUM_COMM_THREADS); - init(); -#ifdef USE_PERILLA_ON_DEMAND - } -#endif - } - - RGIter::RGIter(amrex::AsyncFillPatchIterator* afpi, bool enableAllTasks): - itrGraph(afpi->destGraph), - implicit(false), - ppteams(true), - //typ(afpi->destGraph->typ), - haveDepGraph(false), - depGraph(NULL), - getFireableTime(0.) 
- { - tid = perilla::tid(); - tg = perilla::wid(); - ntid = perilla::wtid(); -#ifdef USE_PERILLA_ON_DEMAND - if(tid==0)Perilla::syncProcesses(); - Perilla::numTeamsFinished=0; - #pragma omp barrier - - if(perilla::isCommunicationThread()) - { - std::vector flattenedGraphArray; - Perilla::flattenGraphHierarchy(m_level_afpi[iteration-1]->m_amrlevel.parent->graphArray, flattenedGraphArray); - while(true){ - Perilla::serviceMultipleGraphCommDynamic(flattenedGraphArray,true,perilla::tid()); - if( Perilla::numTeamsFinished == perilla::NUM_THREAD_TEAMS) - { - /*perilla::syncWorkers(ntid); - flattenedGraphArray.clear(); - if(tg==0) Perilla::numTeamsFinished=0; - perilla::syncWorkers(ntid);*/ - break; - } - } - }else{ -#endif - itrGraph->worker[tg]->barr->sync(perilla::NUM_THREADS_PER_TEAM-perilla::NUM_COMM_THREADS); - if(perilla::isMasterWorkerThread()) - afpi->Reset(); - itrGraph->worker[tg]->barr->sync(perilla::NUM_THREADS_PER_TEAM-perilla::NUM_COMM_THREADS); - if(enableAllTasks) - itrGraph->enableAllRegions(); - itrGraph->worker[tg]->barr->sync(perilla::NUM_THREADS_PER_TEAM-perilla::NUM_COMM_THREADS); - init(); -#ifdef USE_PERILLA_ON_DEMAND - } -#endif - } - -#ifndef USE_PERILLA_ON_DEMAND - RGIter::RGIter(Vector afpi, Vector upper_afpi, - amrex::MultiFab& dest, int bG, double tm, int ind, int sc, int nc, int itr): - itrGraph(afpi[itr-1]->destGraph), - m_level_afpi(afpi), - m_upper_level_afpi(upper_afpi), - boxGrow(bG), - time(tm), - index(ind), - scomp(sc), - ncomp(nc), - iteration(itr), - implicit(true), - ppteams(true), - //typ(afpi[itr-1]->destGraph->typ), - haveDepGraph(false), - depGraph(NULL), - getFireableTime(0.) - { - int myProc = amrex::ParallelDescriptor::MyProc(); - bool push = true; - - tid = perilla::tid(); - tg = perilla::wid(); - ntid = perilla::wtid(); - AsyncFillPatchIterator::initialSend(afpi, upper_afpi, bG, tm, ind, 0, nc, itr); - - itrGraph->worker[tg]->barr->sync(perilla::NUM_THREADS_PER_TEAM-perilla::NUM_COMM_THREADS); - if(perilla::isMasterWorkerThread()) - m_level_afpi[iteration-1]->Reset(); - itrGraph->worker[tg]->barr->sync(perilla::NUM_THREADS_PER_TEAM-perilla::NUM_COMM_THREADS); - - if(ntid == perilla::NUM_THREADS_PER_TEAM-2) - { - int f; - int level = m_level_afpi[iteration-1]->m_amrlevel.level; - double dt = m_level_afpi[iteration-1]->m_amrlevel.parent->dtLevel(level); - this->currentItr = 1; - this->totalItr = 1; - - //////////////////////////////////////Push Pull Thread Start///////////////////////// - while(m_level_afpi[iteration-1]->destGraph->worker[tg]->completedRegionQueue->queueSize(true) != m_level_afpi[iteration-1]->destGraph->worker[tg]->totalTasks || - m_level_afpi[iteration-1]->destGraph->worker[tg]->computedTasks != m_level_afpi[iteration-1]->destGraph->worker[tg]->totalTasks) - { - f = m_level_afpi[iteration-1]->destGraph->getFireableRegion(tg); - if(f != -1) - { - m_level_afpi[iteration-1]->Receive(this,dest,boxGrow,time,index,scomp,ncomp,f,true); - m_level_afpi[iteration-1]->destGraph->setFireableRegion(f); - if(m_level_afpi[iteration-1]->destGraph->worker[tg]->unfireableRegionQueue->queueSize(true) !=0 && - m_level_afpi[iteration-1]->destGraph->worker[tg]->fireableRegionQueue->queueSize(true) < 2) - continue; - } - - if(m_level_afpi[iteration-1]->destGraph->worker[tg]->computedRegionQueue->queueSize() != 0) - { - f = m_level_afpi[iteration-1]->destGraph->worker[tg]->computedRegionQueue->removeRegion(); - - if(push & level == m_level_afpi[iteration-1]->m_amrlevel.parent->finestLevel() && iteration < 
m_level_afpi[iteration-1]->m_amrlevel.parent->nCycle(level)) - m_level_afpi[iteration]->SendIntraLevel(*(this),boxGrow,time+dt,index,scomp,ncomp,iteration,f,true); - - if(push & level < m_level_afpi[iteration-1]->m_amrlevel.parent->finestLevel()) - { - for(int i=0; i < m_level_afpi[iteration-1]->m_amrlevel.parent->nCycle(level+1); i++) - { - m_upper_level_afpi[i]->SendInterLevel(this,boxGrow,time+(i*m_level_afpi[iteration-1]->m_amrlevel.parent->dtLevel(level+1)),index,scomp,ncomp,i+1,f,true); - } - } - m_level_afpi[iteration-1]->destGraph->worker[tg]->completedRegionQueue->addRegion(f,true); - } - } - //fout.close(); - ////////////////////////////////////////////////////////Push Pull Thread End//////////////////// - } - else - { - //fout << "Calling init "<< std::endl; - //fout.close(); - init(); - } - } - -#else - - RGIter::RGIter(Vector afpi, Vector upper_afpi, - amrex::MultiFab& dest, int bG, double tm, int ind, int sc, int nc, int itr) -: - itrGraph(afpi[itr-1]->destGraph), - m_level_afpi(afpi), - m_upper_level_afpi(upper_afpi), - _dest(&dest), - boxGrow(bG), - time(tm), - index(ind), - scomp(sc), - ncomp(nc), - iteration(itr), - implicit(true), - ppteams(true), - haveDepGraph(false), - depGraph(NULL), - getFireableTime(0.) - { - int myProc = amrex::ParallelDescriptor::MyProc(); - bool push = true; - tid = perilla::tid(); - tg = perilla::wid(); - ntid= perilla::wtid(); - if(tid==0)Perilla::syncProcesses(); - Perilla::numTeamsFinished=0; - #pragma omp barrier - - if(perilla::isCommunicationThread()) - { - std::vector flattenedGraphArray; - Perilla::flattenGraphHierarchy(m_level_afpi[iteration-1]->m_amrlevel.parent->graphArray, flattenedGraphArray); - while(true){ - Perilla::serviceMultipleGraphCommDynamic(flattenedGraphArray,true,perilla::tid()); - if( Perilla::numTeamsFinished == perilla::NUM_THREAD_TEAMS) - { - flattenedGraphArray.clear(); - break; - } - } - }else -{ - - AsyncFillPatchIterator::initialSend(afpi, upper_afpi, bG, tm, ind, 0, nc, itr); - //AsyncFillPatchIterator::initialSend(m_level_afpi, m_upper_level_afpi, boxGrow, time, index, scomp, ncomp, iteration); - - itrGraph->worker[tg]->barr->sync(perilla::NUM_THREADS_PER_TEAM-perilla::NUM_COMM_THREADS); - if(perilla::isMasterWorkerThread()) - m_level_afpi[iteration-1]->Reset(); - itrGraph->worker[tg]->barr->sync(perilla::NUM_THREADS_PER_TEAM-perilla::NUM_COMM_THREADS); - - if(ntid == perilla::NUM_THREADS_PER_TEAM-2) - { - int f; - int level = m_level_afpi[iteration-1]->m_amrlevel.level; - double dt = m_level_afpi[iteration-1]->m_amrlevel.parent->dtLevel(level); - this->currentItr = 1; - this->totalItr = 1; - while(m_level_afpi[iteration-1]->destGraph->worker[tg]->completedRegionQueue->queueSize(true) != m_level_afpi[iteration-1]->destGraph->worker[tg]->totalTasks || - m_level_afpi[iteration-1]->destGraph->worker[tg]->computedTasks != m_level_afpi[iteration-1]->destGraph->worker[tg]->totalTasks) - { - f = m_level_afpi[iteration-1]->destGraph->getFireableRegion(tg); - if(f != -1) - { - m_level_afpi[iteration-1]->Receive(this,*_dest,boxGrow,time,index,scomp,ncomp,f,true); - m_level_afpi[iteration-1]->destGraph->setFireableRegion(f); - if(m_level_afpi[iteration-1]->destGraph->worker[tg]->unfireableRegionQueue->queueSize(true) !=0 && - m_level_afpi[iteration-1]->destGraph->worker[tg]->fireableRegionQueue->queueSize(true) < 2) - continue; - } - - if(m_level_afpi[iteration-1]->destGraph->worker[tg]->computedRegionQueue->queueSize() != 0) - { - f = m_level_afpi[iteration-1]->destGraph->worker[tg]->computedRegionQueue->removeRegion(); 
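// A minimal sketch (not part of the original Perilla sources) of the
// dedicated scheduler thread above (ntid == NUM_THREADS_PER_TEAM-2): it makes
// regions fireable, drains regions the compute threads finished, pushes their
// data to the next iteration or finer level, and retires them until every
// task is both computed and completed. Single-threaded, with stub queues.
#include <queue>

struct WorkerQueues {
    std::queue<int> unfireable, fireable, computed, completed;
    int totalTasks = 0;
};

int main() {
    WorkerQueues w;
    for (int f = 0; f < 4; ++f) { w.unfireable.push(f); ++w.totalTasks; }

    while ((int)w.completed.size() != w.totalTasks) {
        if (!w.unfireable.empty()) {              // getFireableRegion()
            int f = w.unfireable.front(); w.unfireable.pop();
            /* post receives for f here */        // Receive(...)
            w.fireable.push(f);                   // setFireableRegion(f)
        }
        if (!w.fireable.empty()) {                // compute threads would run here
            int f = w.fireable.front(); w.fireable.pop();
            w.computed.push(f);
        }
        if (!w.computed.empty()) {                // drain computedRegionQueue
            int f = w.computed.front(); w.computed.pop();
            /* forward f's data here */           // SendIntraLevel/SendInterLevel(...)
            w.completed.push(f);                  // completedRegionQueue
        }
    }
    return 0;
}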
- - if(push & level == m_level_afpi[iteration-1]->m_amrlevel.parent->finestLevel() && iteration < m_level_afpi[iteration-1]->m_amrlevel.parent->nCycle(level)) - m_level_afpi[iteration]->SendIntraLevel(*(this),boxGrow,time+dt,index,scomp,ncomp,iteration,f,true); - - if(push & level < m_level_afpi[iteration-1]->m_amrlevel.parent->finestLevel()) - { - for(int i=0; i < m_level_afpi[iteration-1]->m_amrlevel.parent->nCycle(level+1); i++) - { - m_upper_level_afpi[i]->SendInterLevel(this,boxGrow,time+(i*m_level_afpi[iteration-1]->m_amrlevel.parent->dtLevel(level+1)),index,scomp,ncomp,i+1,f,true); - } - } - m_level_afpi[iteration-1]->destGraph->worker[tg]->completedRegionQueue->addRegion(f,true); - } - } - } - else - { - //fout << "Calling init "<< std::endl; - //fout.close(); - init(); - } -} - } - -#endif - - using namespace perilla; - - RGIter::~RGIter() - { - //fout.close(); - } - - void RGIter::init() - { - if(itrGraph->fabTiles.size() == 0) - tiling = false; - else - tiling = true; - - int myProc = amrex::ParallelDescriptor::MyProc(); - if(implicit) - { - if(!itrGraph->isGraphEmptyV2()) - { - currentRegion = itrGraph->getPulledFireableRegion(); - if(tiling) - totalItr = std::ceil( (1.0*itrGraph->fabTiles[currentRegion]->numTiles) / (perilla::NUM_THREADS_PER_TEAM-perilla::NUM_COMM_THREADS-1) ); - else - totalItr = 1; - - currentItr = 1; - - currentTile = 0; - if(tiling) - for(currentTile = 0; currentTile < itrGraph->fabTiles[currentRegion]->numTiles; currentTile++) - if(currentTile % (perilla::NUM_THREADS_PER_TEAM-perilla::NUM_COMM_THREADS-1) == ntid) - break; - } - } - else - { - if(!itrGraph->isGraphEmpty()) - { - if(haveDepGraph) - currentRegion = itrGraph->getAnyFireableRegion(*depGraph); - else - currentRegion = itrGraph->getAnyFireableRegion(); - - if(tiling) - totalItr = std::ceil( (1.0*itrGraph->fabTiles[currentRegion]->numTiles) / (perilla::NUM_THREADS_PER_TEAM-perilla::NUM_COMM_THREADS) ); - else - totalItr = 1; - - currentItr = 1; - - currentTile = 0; - if(tiling) - for(currentTile = 0; currentTile < itrGraph->fabTiles[currentRegion]->numTiles; currentTile++) - if(currentTile % (perilla::NUM_THREADS_PER_TEAM-perilla::NUM_COMM_THREADS) == ntid) - break; - } - } - } - - //! Increment iterator to the next tile we own. - void RGIter::operator++ () - { - currentItr++; - if(tiling) - for( (currentTile == itrGraph->fabTiles[currentRegion]->numTiles ? 
currentTile : ++currentTile); currentTile < itrGraph->fabTiles[currentRegion]->numTiles; currentTile++) - { - if(implicit) - { - if(currentTile % (perilla::NUM_THREADS_PER_TEAM-perilla::NUM_COMM_THREADS-1) == ntid) break; - } - else - { - if(currentTile % (perilla::NUM_THREADS_PER_TEAM-perilla::NUM_COMM_THREADS) == ntid) break; - } - } - int myProc = amrex::ParallelDescriptor::MyProc(); - if(currentItr > totalItr) - { - if(implicit) itrGraph->regionComputed(currentRegion); - else itrGraph->finalizeRegion(currentRegion); - if(implicit) - { - if(!itrGraph->isGraphEmptyV2()) - { - currentRegion = itrGraph->getPulledFireableRegion(); - if(tiling) - totalItr = std::ceil( (1.0*itrGraph->fabTiles[currentRegion]->numTiles) / (perilla::NUM_THREADS_PER_TEAM-perilla::NUM_COMM_THREADS-1) ); - else - totalItr = 1; - - currentItr = 1; - - currentTile = 0; - if(tiling) - for(currentTile = 0; currentTile < itrGraph->fabTiles[currentRegion]->numTiles; currentTile++) - if(currentTile % (perilla::NUM_THREADS_PER_TEAM-perilla::NUM_COMM_THREADS-1) == ntid/*-perilla::NUM_COMM_THREADS*/) - break; - } - } - else - { - if(!itrGraph->isGraphEmpty()) - { - if(haveDepGraph) - currentRegion = itrGraph->getAnyFireableRegion(*depGraph); - else - currentRegion = itrGraph->getAnyFireableRegion(); - if(tiling) - totalItr = std::ceil( (1.0*itrGraph->fabTiles[currentRegion]->numTiles) / (perilla::NUM_THREADS_PER_TEAM-perilla::NUM_COMM_THREADS) ); - else - totalItr = 1; - - currentItr = 1; - currentTile = 0; - if(tiling) - for(currentTile = 0; currentTile < itrGraph->fabTiles[currentRegion]->numTiles; currentTile++) - if(currentTile % (perilla::NUM_THREADS_PER_TEAM-perilla::NUM_COMM_THREADS) == ntid/*-perilla::NUM_COMM_THREADS*/) - break; - } - } - } - } - - bool RGIter::isValid () - { - if(perilla::isCommunicationThread()) return false; - bool valid; - bool do_remaining = true; - - int myProc = amrex::ParallelDescriptor::MyProc(); - - if(implicit) - { - if(ntid != perilla::NUM_THREADS_PER_TEAM-1) - { - valid = !itrGraph->isGraphEmptyV2(); - if(valid) - { - do_remaining = false; - } - } - - if(do_remaining) - { - bool push = false; - int f; - int level = m_level_afpi[iteration-1]->m_amrlevel.level; - double dt = m_level_afpi[iteration-1]->m_amrlevel.parent->dtLevel(level); - this->currentItr = 1; - this->totalItr = 1; -#if 0 - while(!itrGraph->isGraphEmpty()) - { - f = itrGraph->worker[tg]->computedRegionQueue->getFrontRegion(true); - - if(push & level == m_level_afpi[iteration-1]->m_amrlevel.parent->finestLevel() && iteration < m_level_afpi[iteration-1]->m_amrlevel.parent->nCycle(level)) - m_level_afpi[iteration]->SendIntraLevel(this,boxGrow,time+dt,index,scomp,ncomp,iteration,f,false); - //else if(level == parent->finestLevel() && iteration == ncycle) - //SborderAFPI[0]->PushOnly(NUM_GROW, time+dt, State_Type, 0, NUM_STATE, f, tid, 0x02, 1); - - if(push & level < m_level_afpi[iteration-1]->m_amrlevel.parent->finestLevel()) - { - for(int i=0; i < m_level_afpi[iteration-1]->m_amrlevel.parent->nCycle(level+1); i++) - { - m_upper_level_afpi[i]->SendInterLevel(this,boxGrow,time+(i*m_level_afpi[iteration-1]->m_amrlevel.parent->dtLevel(level+1)),index,scomp,ncomp,i+1,f,false); - //upperLevel.SborderAFPI[i]->PushOnly(NUM_GROW, time+(i*parent->dtLevel(level+1)), State_Type, 0, NUM_STATE, f, tid, tuc, tempf, false); - } - } - - itrGraph->worker[tg]->barr->sync(perilla::NUM_THREADS_PER_TEAM-perilla::NUM_COMM_THREADS-1); - if(perilla::isMasterWorkerThread()) - { - f = itrGraph->worker[tg]->computedRegionQueue->removeRegion(); - 
itrGraph->worker[tg]->completedRegionQueue->addRegion(f,true);
-                }
-            }
-#endif
-
-            //m_level_afpi[iteration-1]->destGraph->worker[tg]->barr->sync(perilla::NUM_THREADS_PER_TEAM-1);
-            if(perilla::isMasterWorkerThread())
-            {
-                m_level_afpi[iteration-1]->completeRegionGraphs();
-#ifdef USE_PERILLA_ON_DEMAND
-                pthread_mutex_lock(&teamFinLock);
-                Perilla::numTeamsFinished++;
-                pthread_mutex_unlock(&teamFinLock);
-#endif
-            }
-            valid = false;
-        }
-    }
-    else
-    {
-        if(itrGraph->isGraphEmpty())
-        {
-            if(perilla::isMasterWorkerThread())
-            {
-                itrGraph->finalizeRegionGraph();
-#ifdef USE_PERILLA_ON_DEMAND
-                pthread_mutex_lock(&teamFinLock);
-                Perilla::numTeamsFinished++;
-                pthread_mutex_unlock(&teamFinLock);
-#endif
-            }
-        }
-        valid = !(itrGraph->isGraphEmpty());
-    }
-    return valid;
-  }
-
-  amrex::Box RGIter::tileBox()
-  {
-    int myProc = amrex::ParallelDescriptor::MyProc();
-
-    if(currentTile == itrGraph->fabTiles[currentRegion]->numTiles)
-    {
-        return amrex::Box();
-    }
-    else
-    {
-        return *(itrGraph->fabTiles[currentRegion]->tileBx[currentTile]);
-    }
-  }
-
-  amrex::Box RGIter::validBox() const
-  {
-    return *(itrGraph->fabTiles[currentRegion]->validBx);
-  }
-
-  amrex::Box RGIter::tilebox()
-  {
-    return this->tileBox();
-  }
-
-  amrex::Box RGIter::growntilebox()
-  {
-    return this->tileBox();
-  }
-
-  amrex::Box RGIter::growntilebox(int ng)
-  {
-    Box bx = this->tileBox();
-    if(currentTile == itrGraph->fabTiles[currentRegion]->numTiles)
-        return bx;
-
-    if (ng < -100) ng = 0;
-    const Box& vbx = validBox();
-    for (int d=0; d<BL_SPACEDIM; ++d) {
-        if (bx.smallEnd(d) == vbx.smallEnd(d)) {
-            bx.growLo(d, ng);
-        }
-        if (bx.bigEnd(d) == vbx.bigEnd(d)) {
-            bx.growHi(d, ng);
-        }
-    }
-    return bx;
-  }
-
-  amrex::Box RGIter::nodaltilebox(int dir)
-  {
-    Box bx = this->tileBox();
-    bx.convert(typ);
-    const Box& vbx = this->validBox();
-    const IntVect& Big = vbx.bigEnd();
-    int d0, d1;
-    if (dir < 0) {
-        d0 = 0;
-        d1 = BL_SPACEDIM-1;
-    } else {
-        d0 = d1 = dir;
-    }
-    for (int d=d0; d<=d1; ++d) {
-        if (typ.cellCentered(d)) { // validbox should also be cell-centered in d-direction.
-            bx.surroundingNodes(d);
-            if (bx.bigEnd(d) <= Big[d]) {
-                bx.growHi(d,-1);
-            }
-        }
-    }
-    return bx;
-  }
-
-  void RGIter::sync_workers()
-  {
-    if(implicit)
-        itrGraph->worker[tg]->l_barr->sync(perilla::NUM_THREADS_PER_TEAM-perilla::NUM_COMM_THREADS-1);
-    else
-        itrGraph->worker[tg]->barr->sync(perilla::NUM_THREADS_PER_TEAM-perilla::NUM_COMM_THREADS);
-  }
-}
diff --git a/Src/AmrTask/rts_impls/runtime_common/RegionGraph.H b/Src/AmrTask/rts_impls/runtime_common/RegionGraph.H
deleted file mode 100755
index d6c17f8fe65..00000000000
--- a/Src/AmrTask/rts_impls/runtime_common/RegionGraph.H
+++ /dev/null
@@ -1,323 +0,0 @@
-#ifndef P_REGIONGRAPH_H
-#define P_REGIONGRAPH_H
-
-#include
-#include
-#include
-#include
-#include
-#include
-#include
-#include
-
-
-using namespace perilla;
-#ifdef PERILLA_DEBUG
-#include "PerillaMemCheck.H"
-extern PerillaMemCheck memcheck;
-#endif
-
-namespace amrex{
-
-    class RegionGraph;
-
-    class FabCopyAssoc
-    {
-      public:
-        LocalConnection l_con;
-        RemoteConnection r_con;
-        FabCopyAssoc *next;
-        FabCopyAssoc *prev;
-        RegionGraph *graphPartner;
-        // CopyAssoc *orig_copyAssoc;
-        FabCopyAssoc()
-        {
-            next=0;
-            prev=0;
-            graphPartner=0;
-        }
-        ~FabCopyAssoc()
-        {
-            if(next) delete next;
-        }
-    };
-
-    class pTileArray
-    {
-      public:
-        int numTiles;
-        std::vector<Box*> tileBx;
-        Box* validBx;
-        pTileArray(): numTiles(0), tileBx(0){}
-        ~pTileArray()
-        {
-            //for(int i=0; i<numTiles; i++) delete tileBx[i];
-        }
-    };
-
-    class Task
-    {
-      public:
-        std::vector<int> state;
-        bool init;
-        FabCopyAssoc *cpAsc_srcHead;
-        FabCopyAssoc *cpAsc_dstHead;
-
-        std::vector<int> depTaskIDs;
-        int numDepTasksCompleted;
-        bool depTasksCompleted;
-
-        Task()
-        {
-            state.reserve(16);
-            depTaskIDs.reserve(1024);
-            depTasksCompleted = true;
-            numDepTasksCompleted = 0;
-            cpAsc_srcHead=0;
-            cpAsc_dstHead=0;
-        }
-
-        ~Task()
-        {
-            state.clear();
-            depTaskIDs.clear();
-            if(cpAsc_srcHead != 0)
-                delete cpAsc_srcHead;
-            if(cpAsc_dstHead != 0)
-                delete cpAsc_dstHead;
-        }
-    };
-
-    class Worker
-    {
-      public:
-        int totalTasks;
-        int computedTasks;
-        bool init;
-        Barrier* barr;
-        Barrier* l_barr;
-        RegionQueue* fireableRegionQueue;
-        RegionQueue* unfireableRegionQueue;
-        RegionQueue* computedRegionQueue;
-        RegionQueue* completedRegionQueue;
-        Worker():init(false), barr(0), l_barr(0), totalTasks(0){}
-
-        ~Worker(){
-            delete barr;
-            delete l_barr;
-            delete fireableRegionQueue;
-            delete unfireableRegionQueue;
-            delete computedRegionQueue;
-            delete completedRegionQueue;
-        }
-    };
-
-    //template
-    class CopyMap
-    {
-      public:
-        std::vector<FArrayBox*> map;
-        CopyMap *next;
-        CopyMap()
-            :
-            next(0)
-        {
-#ifdef PERILLA_DEBUG
-            memcheck.add(memcheck.genKey(this), (void*)this, "CopyMap");
-#endif
-        }
-
-        void alloc_CopyMap(const MultiFab& mf)
-        {
-            //Array IndArr = mf.IndexArray();
-            const int n = mf.IndexArray().size();
-            //const int n = mf.size();
-            map.reserve(n);
-            //sMap.resize(n);
-            for (int i = 0; i < n; ++i)
-            {
-                int K = mf.IndexArray()[i];
-                const Box& tmp = mf.fabbox(K);
-                map.push_back(new FArrayBox(tmp, mf.nComp(), false, true));
-            }
-        }
-        ~CopyMap()
-        {
-            for (int i = 0; i < map.size(); ++i)
-            {
-                delete map[i];
-            }
-            map.clear();
-            if(next !=0 )
-                delete next;
-#ifdef PERILLA_DEBUG
-            memcheck.remove(memcheck.genKey(this));
-#endif
-        }
-    };
-
-    class RegionGraph
-    {
-      public:
-        static int graphCnt;
-        int graphID;
-        int numTasks;
-        int numFabs;
-        int totalFinishes;
-        bool isDepGraph;
-        bool* okToReset;
-        pthread_mutex_t finishLock;
-
-        std::vector<pTileArray*> fabTiles;
-        std::vector<pTileArray*> fabTiles_gtbx;
-
-        std::vector<FArrayBox*> lMap;
-        std::vector<FArrayBox*> sMap;
-        std::vector<FArrayBox*> rMap;
-        CopyMap *sCopyMapHead;
-        CopyMap *rCopyMapHead;
-
-        std::vector<Task*> task;
-        std::vector<Worker*> worker;
-
-        RegionGraph* srcLinkGraph;
-
-      public:
-        RegionGraph(int numtasks);
-        void Initialize();
-        void Reset();
-        bool isGraphEmpty();
-        bool isGraphEmptyV2();
-        void finalizeGraph();
-        void regionGraphReset(int numfabs);
-        void regionGraphMinReset(void);
-        void enableAllRegions();
-        void disableRegion(int r);
-        void finalizeRegion(int r);
-        void finalizeRegionGraph();
-        void regionComputed(int r);
-        bool isFireableRegion(int r);
-        int getAnyFireableRegion();
-        int getAnyFireableRegion(RegionGraph& depGraph);
-        int getPulledFireableRegion();
-        int getFireableRegion(bool isSingleThread=false);
-        void setFireableRegion(int r);
-        void graphTeardown();
-        void workerTeardown();
-        int size(){return task.size();}
-
-        int getRegion(){
-            return worker[perilla::wid()]->computedRegionQueue->getFrontRegion(true);
-        }
-
-        void syncComputeWorkerThreads(){
-            worker[perilla::wid()]->barr->sync(perilla::NUM_THREADS_PER_TEAM-1);
-        }
-        void syncComputeWorkerThreads(int numthreads){
-            worker[perilla::wid()]->barr->sync(numthreads);
-        }
-
-        void syncWorkerThreads(){
-            worker[perilla::wid()]->barr->sync(perilla::NUM_THREADS_PER_TEAM-1);
-        }
-
-        void syncWorkerThreads(int numthreads){
-            worker[perilla::wid()]->barr->sync(numthreads);
-        }
-
-        void alloc_lMap(const MultiFab& mf)
-        {
-            const int n = mf.IndexArray().size();
-            lMap.reserve(n);
-            for (int i = 0; i < n; ++i)
-            {
-                int K = mf.IndexArray()[i];
-                const Box& tmp = mf.fabbox(K);
-                lMap.push_back(new FArrayBox(tmp, mf.nComp(), false, true));
-            }
-        }
-
-        void alloc_sMap(const MultiFab& mf)
-        {
-            const int n = mf.IndexArray().size();
-            sMap.reserve(n);
-            for (int i = 0; i < n; ++i)
-            {
-                int K = mf.IndexArray()[i];
-                const Box& tmp = mf.fabbox(K);
-                sMap.push_back(new FArrayBox(tmp, mf.nComp(), false, true));
-            }
-        }
-
-        void alloc_rMap(const MultiFab& mf)
-        {
-            const int n = mf.IndexArray().size();
-            rMap.reserve(n);
-            for (int i = 0; i < n; ++i)
-            {
-                int K = mf.IndexArray()[i];
-                const Box& tmp = mf.fabbox(K);
-                rMap.push_back(new FArrayBox(tmp, mf.nComp(), false, true));
-            }
-        }
-
-        void buildTileArray(const MultiFab& mf)
-        {
-            const int n = mf.IndexArray().size();
-            fabTiles.resize(n);
-
-            for (int i = 0; i < n; ++i)
-            {
-                fabTiles[i] = new pTileArray();
-            }
-            for (MFIter mfi(mf, true); mfi.isValid(); ++mfi)
-            {
-                fabTiles[mfi.LocalIndex()]->numTiles++;
-                fabTiles[mfi.LocalIndex()]->tileBx.push_back(new Box(mfi.tilebox()));
-                fabTiles[mfi.LocalIndex()]->validBx = new Box(mfi.validbox());
-            }
-        }
-
-        void buildTileArray_gtbx(const MultiFab& mf, int ng)
-        {
-            const int n = mf.IndexArray().size();
-            fabTiles_gtbx.resize(n);
-
-            for (int i = 0; i < n; ++i)
-            {
-                fabTiles_gtbx[i] = new pTileArray();
-            }
-            for (MFIter mfi(mf, true); mfi.isValid(); ++mfi)
-            {
-                fabTiles_gtbx[mfi.LocalIndex()]->numTiles++;
-                fabTiles_gtbx[mfi.LocalIndex()]->tileBx.push_back(new Box(mfi.growntilebox(ng)));
-            }
-        }
-
-        void buildTileArray(const amrex::MultiFab& mf, const amrex::IntVect& tilesize)
-        {
-            int myProc = amrex::ParallelDescriptor::MyProc();
-            const int n = mf.indexArray.size();
-            fabTiles.resize(n);
-
-            //typ = mf.boxArray().ixType();
-
-            for (int i = 0; i < n; ++i)
-            {
-                fabTiles[i] = new pTileArray();
-            }
-            for (amrex::MFIter mfi(mf, tilesize); mfi.isValid(); ++mfi)
-            {
-                if( fabTiles[mfi.LocalIndex()]->numTiles == 0 )
-                    fabTiles[mfi.LocalIndex()]->validBx = new amrex::Box(mfi.validbox());
-                fabTiles[mfi.LocalIndex()]->numTiles++;
-                fabTiles[mfi.LocalIndex()]->tileBx.push_back(new amrex::Box(mfi.tilebox()));
-            }
-        }
-
-        ~RegionGraph();
-    };
-}//end
namespace -#endif diff --git a/Src/AmrTask/rts_impls/runtime_common/RegionGraph.cpp b/Src/AmrTask/rts_impls/runtime_common/RegionGraph.cpp deleted file mode 100755 index 0e72a1c631e..00000000000 --- a/Src/AmrTask/rts_impls/runtime_common/RegionGraph.cpp +++ /dev/null @@ -1,792 +0,0 @@ -#include -#include -#include - -using namespace std; -using namespace amrex; -using namespace perilla; - -int RegionGraph::graphCnt = 0; - -RegionGraph::RegionGraph(int numtasks) -{ - sCopyMapHead = 0; - rCopyMapHead = 0; - srcLinkGraph = 0; - isDepGraph = false; - numFabs = numtasks; - numTasks = numtasks; - graphID = ++graphCnt; - worker.resize(perilla::NUM_THREAD_TEAMS); - task.resize(numTasks); - totalFinishes=0; - okToReset = new bool[perilla::NUM_THREAD_TEAMS]; - finishLock= PTHREAD_MUTEX_INITIALIZER; - Initialize(); -#ifdef PERILLA_DEBUG - memcheck.add(memcheck.genKey(this), (void*)this, "Package"); -#endif -} - -void RegionGraph::Initialize() -{ - int numfabs = numTasks; - - int tg = WorkerThread::perilla_wid(); - for(int tg=0; tgbarr = new Barrier(perilla::NUM_THREADS_PER_TEAM - perilla::NUM_COMM_THREADS); - worker[tg]->l_barr = new Barrier(perilla::NUM_THREADS_PER_TEAM - perilla::NUM_COMM_THREADS -1); - if(numfabs <= perilla::TASK_QUEUE_DEFAULT_SIZE) - { - worker[tg]->fireableRegionQueue = new RegionQueue(); - worker[tg]->unfireableRegionQueue = new RegionQueue(); - worker[tg]->computedRegionQueue = new RegionQueue(); - worker[tg]->completedRegionQueue = new RegionQueue(); - } - else - { - worker[tg]->fireableRegionQueue = new RegionQueue(numfabs); - worker[tg]->unfireableRegionQueue = new RegionQueue(numfabs); - worker[tg]->computedRegionQueue = new RegionQueue(numfabs); - worker[tg]->completedRegionQueue = new RegionQueue(numfabs); - } - worker[tg]->totalTasks = 0; - worker[tg]->computedTasks = 0; - for(int f=0; f < numfabs; f++) - { - if(WorkerThread::isMyRegion(tg, f)) - { - task[f] = new Task(); - worker[tg]->unfireableRegionQueue->addRegion(f); - worker[tg]->totalTasks++; - for(int i=0; i<16; i++) - task[f]->state[i] = 0; - task[f]->init = true; - } - } - worker[tg]->init = true; - okToReset[tg] = false; - } -} - -void RegionGraph::Reset() -{ - int tg= perilla::wid(); - pthread_mutex_lock(&finishLock); - if(okToReset[tg]) - totalFinishes--; - pthread_mutex_unlock(&finishLock); - - - if(okToReset[tg]) - { - worker[tg]->totalTasks = 0; - worker[tg]->computedTasks = 0; - while(worker[tg]->completedRegionQueue->queueSize(true) > 0) - { - int r = worker[tg]->completedRegionQueue->removeRegion(true); - if(WorkerThread::isMyRegion(tg, r)) - { - worker[tg]->unfireableRegionQueue->addRegion(r,true); - worker[tg]->totalTasks++; - for(int i=0; i<16; i++) - task[r]->state[i] = 0; - task[r]->init = true; - if(task[r]->depTaskIDs.size() > 0) - task[r]->depTasksCompleted = false; - } - else - break; - } - } -} - -bool RegionGraph::isGraphEmpty() -{ - int tg= perilla::wid(); - worker[tg]->barr->sync(perilla::NUM_THREADS_PER_TEAM-perilla::NUM_COMM_THREADS); - if(worker[tg]->completedRegionQueue->queueSize(true)== worker[tg]->totalTasks) - return true; - return false; -} - -bool RegionGraph::isGraphEmptyV2() -{ - int tg=perilla::wid(); - - if(worker[tg]->completedRegionQueue->queueSize(true) == worker[tg]->totalTasks || worker[tg]->computedTasks == worker[tg]->totalTasks) - return true; - return false; -} - -void RegionGraph::finalizeGraph() -{ - pthread_mutex_lock(&finishLock); - totalFinishes++; - int tg=perilla::wid(); - okToReset[tg]=true; - pthread_mutex_unlock(&finishLock); -} - -void 
RegionGraph::regionGraphReset(int numfabs) -{ - int nt; - int tg; - int r; - - { - tg = perilla::wid(); - nt = perilla::wtid(); - if(perilla::isMasterThread()) - totalFinishes=0; - if(perilla::isMasterWorkerThread()) - { - worker[tg]->totalTasks = 0; - worker[tg]->computedTasks = 0; - while(worker[tg]->completedRegionQueue->queueSize(true) > 0) - { - r = worker[tg]->completedRegionQueue->removeRegion(true); - if(WorkerThread::isMyRegion(tg, r)) - { - worker[tg]->unfireableRegionQueue->addRegion(r,true); - worker[tg]->totalTasks++; - for(int i=0; i<16; i++) - task[r]->state[i] = 0; - task[r]->init = true; - } - else - break; - } - okToReset[tg] = false; - } - } -} - -void RegionGraph::regionGraphMinReset(void) -{ - int nt; - int tg; - int r; - { - tg = WorkerThread::perilla_wid(); - nt = WorkerThread::perilla_wtid(); - if(perilla::isMasterThread()) - totalFinishes=0; - if(perilla::isMasterWorkerThread()) - { - while(worker[tg]->completedRegionQueue->queueSize(true) > 0) - { - r = worker[tg]->completedRegionQueue->removeRegion(true); - if(WorkerThread::isMyRegion(tg, r)) - { - worker[tg]->unfireableRegionQueue->addRegion(r,true); - } - else - break; - } - okToReset[tg] = false; - } - } -} - - -void RegionGraph::enableAllRegions() -{ - int numfabs = numTasks; - int r; - int tg = WorkerThread::perilla_wid(); - worker[tg]->l_barr->sync(perilla::NUM_THREADS_PER_TEAM-perilla::NUM_COMM_THREADS); // Barrier to synchronize team threads - if(perilla::isMasterWorkerThread()) - for(int f=0; funfireableRegionQueue->removeRegion(true); - worker[tg]->fireableRegionQueue->addRegion(r,true); - } - worker[tg]->barr->sync(perilla::NUM_THREADS_PER_TEAM-perilla::NUM_COMM_THREADS); // Barrier to synchronize team threads -} - -void RegionGraph::disableRegion(int r) -{ - int tg = WorkerThread::perilla_wid(); - if(perilla::isMasterWorkerThread()) - if(WorkerThread::isMyRegion(tg, r)) - { - int rID = worker[tg]->fireableRegionQueue->removeRegion(true); - worker[tg]->unfireableRegionQueue->addRegion(rID,true); - } -} - -void RegionGraph::regionComputed(int r) -{ - int tg= perilla::wid(); - worker[tg]->l_barr->sync(perilla::NUM_THREADS_PER_TEAM-perilla::NUM_COMM_THREADS-1); - if(perilla::isMasterWorkerThread()) - if(WorkerThread::isMyRegion(tg, r)) - { - int rr = worker[tg]->fireableRegionQueue->removeRegion(); - if(r != rr) - { - std::cout << "ERROR: In computedeRegion" << std::endl; - exit(EXIT_FAILURE); - } - worker[tg]->computedRegionQueue->addRegion(rr); - worker[tg]->computedTasks++; - } - worker[tg]->l_barr->sync(perilla::NUM_THREADS_PER_TEAM-perilla::NUM_COMM_THREADS-1); -} - -void RegionGraph::finalizeRegion(int r) -{ - int tg= perilla::wid(); - int ntid=perilla::wtid(); - worker[tg]->barr->sync(perilla::NUM_THREADS_PER_TEAM-perilla::NUM_COMM_THREADS); // Barrier to synchronize team threads - if(perilla::isMasterWorkerThread()) - if(WorkerThread::isMyRegion(tg, r)) - { - int rr = worker[tg]->fireableRegionQueue->removeRegion(true); - if(r != rr) - { - std::cout << "ERROR: In completeRegion" << std::endl; - exit(EXIT_FAILURE); - } - worker[tg]->completedRegionQueue->addRegion(rr,true); - } - worker[tg]->barr->sync(perilla::NUM_THREADS_PER_TEAM-perilla::NUM_COMM_THREADS); // Barrier to synchronize team threads -} - -void RegionGraph::finalizeRegionGraph() -{ - int tg= perilla::wid(); - pthread_mutex_lock(&finishLock); - totalFinishes++; - okToReset[tg]=true; - pthread_mutex_unlock(&finishLock); -} - -bool RegionGraph::isFireableRegion(int r) -{ - int myProc = ParallelDescriptor::MyProc(); - FabCopyAssoc *cpDst 
-bool RegionGraph::isFireableRegion(int r) -{ - int myProc = ParallelDescriptor::MyProc(); - FabCopyAssoc *cpDst = task[r]->cpAsc_dstHead; - if(lMap.size() > 0) - if(lMap[r]->l_con.firingRuleCnt != lMap[r]->l_con.ndcpy) - { - return false; - } - while(cpDst != 0) - { - if(cpDst->l_con.firingRuleCnt != cpDst->l_con.ndcpy) - { - return false; - } - cpDst = cpDst->next; - } - - if(srcLinkGraph != 0) - { - if(!task[r]->depTasksCompleted) - { - for(int i=0; i<task[r]->depTaskIDs.size(); i++){ - if(!srcLinkGraph->isFireableRegion(task[r]->depTaskIDs[i])) - return false; - } - task[r]->depTasksCompleted = true; - } - } - - if(ParallelDescriptor::NProcs() == 1) return true; - - if(lMap.size() > 0) - if(lMap[r]->r_con.firingRuleCnt != lMap[r]->r_con.nrcv) - { - return false; - } - - cpDst = task[r]->cpAsc_dstHead; - while(cpDst != 0) - { - if(cpDst->r_con.firingRuleCnt != cpDst->r_con.nrcv) - { - return false; - } - cpDst = cpDst->next; - } - return true; -} - - -int RegionGraph::getFireableRegion(bool isSingleThread) -{ - int r = -1; - bool fireable; - int tg= perilla::wid(); - - if(worker[tg]->unfireableRegionQueue->queueSize(true)!=0 && worker[tg]->fireableRegionQueue->queueSize() == 0) - { - fireable = false; - r = worker[tg]->unfireableRegionQueue->removeRegion(true); - while(!fireable) - { - fireable = isFireableRegion(r); - if(!fireable) - { - worker[tg]->unfireableRegionQueue->addRegion(r,true); - r = worker[tg]->unfireableRegionQueue->removeRegion(true); - } - } - } - else if(worker[tg]->unfireableRegionQueue->queueSize(true)!=0) - { - int unfQsize = worker[tg]->unfireableRegionQueue->queueSize(true); - for(int i = 0; i < unfQsize; i++) - { - int tr = worker[tg]->unfireableRegionQueue->removeRegion(true); - if(isFireableRegion(tr)) - { - r = tr; - break; - } - else - worker[tg]->unfireableRegionQueue->addRegion(tr,true); - } - } - return r; -} - -void RegionGraph::setFireableRegion(int r) -{ - worker[perilla::wid()]->fireableRegionQueue->addRegion(r); -} - -int RegionGraph::getAnyFireableRegion() -{ - int myProc = ParallelDescriptor::MyProc(); - int tg = perilla::wid(); - int nt = perilla::wtid(); - worker[tg]->l_barr->sync(perilla::NUM_THREADS_PER_TEAM-1); - if(nt == 0 && worker[tg]->fireableRegionQueue->queueSize()==0) - { - bool fireable = false; - int r = worker[tg]->unfireableRegionQueue->removeRegion(true); - while(!fireable) - { - fireable = isFireableRegion(r); - if(!fireable) - { - worker[tg]->unfireableRegionQueue->addRegion(r,true); - r = worker[tg]->unfireableRegionQueue->removeRegion(true); - } - else - worker[tg]->fireableRegionQueue->addRegion(r,true); - } - } - worker[tg]->l_barr->sync(perilla::NUM_THREADS_PER_TEAM-1); - return worker[tg]->fireableRegionQueue->getFrontRegion(true); -} - -int RegionGraph::getAnyFireableRegion(RegionGraph& depGraph) -{ - int nt; - int tg; - int r; - bool fireable; - - int myProc = amrex::ParallelDescriptor::MyProc(); - - tg = perilla::wid(); - nt = perilla::wtid(); - if(nt == 0 && worker[tg]->fireableRegionQueue->queueSize()==0) - { - fireable = false; - r = worker[tg]->unfireableRegionQueue->removeRegion(true); - while(!fireable) - { - fireable = isFireableRegion(r); - fireable &= depGraph.isFireableRegion(r); - if(!fireable) - { - worker[tg]->unfireableRegionQueue->addRegion(r,true); - r = worker[tg]->unfireableRegionQueue->removeRegion(true); - } - else - worker[tg]->fireableRegionQueue->addRegion(r,true); - } - } - worker[tg]->l_barr->sync(perilla::NUM_THREADS_PER_TEAM-perilla::NUM_COMM_THREADS); // Barrier to synchronize team threads - r = worker[tg]->fireableRegionQueue->getFrontRegion(true); - return r; -} - - - -int RegionGraph::getPulledFireableRegion
-{ - bool fireable; - int myProc = ParallelDescriptor::MyProc(); - int tg = WorkerThread::perilla_wid(); - int nt = WorkerThread::perilla_wtid(); - if(nt == 0 && worker[tg]->fireableRegionQueue->queueSize()==0) - { - while(worker[tg]->fireableRegionQueue->queueSize()==0); - } - worker[tg]->l_barr->sync(perilla::NUM_THREADS_PER_TEAM-perilla::NUM_COMM_THREADS-1); - return worker[tg]->fireableRegionQueue->getFrontRegion(true); -} - -void RegionGraph::graphTeardown() -{ -#if 0 - MPI_Status status; - Package* package; - int tg= perilla::wid(); - int numfabs = numTasks; - -#if 0 - for(int f=0; fcpAsc_dstHead; - while(cpDst != 0) - { - cpDst->l_con.firingRuleCnt = 0; - - for(int i=0; il_con.ndcpy; i++) - { - while(cpDst->l_con.dcpy[i].pQueue.queueSize() >= 1) - { - package = cpDst->l_con.dcpy[i].pQueue.dequeue(); - //package->completed = false; - //package->served = false; - //package->request = MPI_REQUEST_NULL; - cpDst->l_con.dcpy[i].recycleQueue.enqueue(package); - } - } - - cpDst = cpDst->next; - } - } - } - - - for(int f=0; fcpAsc_srcHead; - while(cpSrc != 0) - { - //cpSrc->l_con.firingRuleCnt = 0; - - for(int i=0; il_con.nscpy; i++) - { - while(cpSrc->l_con.scpy[i].pQueue.queueSize() >= 1) - { - package = cpSrc->l_con.scpy[i].pQueue.dequeue(); - - FabCopyAssoc* cpDst = cpSrc->graphPartner->task[cpSrc->l_con.scpy[i].nd]->cpAsc_dstHead; - while(cpDst != 0) - { - if(cpDst->graphPartner == this) //graphArray[g]) - break; - cpDst = cpDst->next; - } - //Package* sPackage = cpSrc->l_con.scpy[i].pQueue.dequeue(true); - pthread_mutex_lock(&(cpDst->l_con.dLock)); - int dPartner = cpSrc->l_con.scpy[i].dPartner; - Package* dPackage = cpDst->l_con.dcpy[dPartner].recycleQueue.dequeue(true); - /* - for(int j=0; jbufSize; j++) - { - dPackage->databuf[j] = sPackage->databuf[j]; - } - */ - std::memcpy(dPackage->databuf, package->databuf, dPackage->bufSize * sizeof(double)); - //std::swap(dPackage->databuf, sPackage->databuf); - - cpDst->l_con.dcpy[dPartner].pQueue.enqueue(dPackage,true); - if(cpDst->l_con.dcpy[dPartner].pQueue.queueSize(true) == 1) - cpDst->l_con.firingRuleCnt++; - pthread_mutex_unlock(&(cpDst->l_con.dLock)); - //cpSrc->l_con.scpy[i].recycleQueue.enqueue(sPackage,true); - - //package->completed = false; - //package->served = false; - //package->request = MPI_REQUEST_NULL; - cpSrc->l_con.scpy[i].recycleQueue.enqueue(package); - } - } - - cpSrc = cpSrc->next; - } - } - } - - - - for(int f=0; f 0) - { - lMap[f]->l_con.firingRuleCnt = 0; - } - } - } -#endif - - if(ParallelDescriptor::NProcs() == 1) return; - - -#ifndef PERILLA_USE_UPCXX - -#if 1 - if(perilla::tid()!=0) return; - for(int f=0; fcpAsc_dstHead; - while(cpDst != 0) - { - cpDst->r_con.firingRuleCnt = 0; - for(int i=0; ir_con.nrcv; i++) - { - while(cpDst->r_con.rcv[i].pQueue.queueSize() >= 1) - { - package = cpDst->r_con.rcv[i].pQueue.dequeue(); - if(package->request != MPI_REQUEST_NULL) -{ - MPI_Cancel( &(package->request) ); -} - package->completed = false; - package->served = false; - package->request = MPI_REQUEST_NULL; - cpDst->r_con.rcv[i].recycleQueue.enqueue(package); - } - } - cpDst = cpDst->next; - } - } - } -#endif - -#if 1 - for(int f=0; fcpAsc_srcHead; - while(cpSrc != 0) - { - //cpSrc->r_con.firingRuleCnt = 0; - for(int i=0; ir_con.nsnd; i++) - { - while(cpSrc->r_con.snd[i].pQueue.queueSize() >= 1) - { - package = cpSrc->r_con.snd[i].pQueue.dequeue(); - MPI_Wait( &(package->request), &status ); - package->completed = false; - package->served = false; - package->request = MPI_REQUEST_NULL; - 
cpSrc->r_con.snd[i].recycleQueue.enqueue(package); - } - } - cpSrc = cpSrc->next; - } - } - } -#endif - - -#if 1 - if(tg == 0) - { - CopyMap* cpDst = rCopyMapHead; - while(cpDst != 0) - { - for(int f=0; fmap.size(); f++) - { - cpDst->map[f]->r_con.firingRuleCnt = 0; - for(int i=0; imap[f]->r_con.nrcv; i++) - { - while(cpDst->map[f]->r_con.rcv[i].pQueue.queueSize() >= 1) - { - package = cpDst->map[f]->r_con.rcv[i].pQueue.dequeue(); - if(package->request != MPI_REQUEST_NULL) - MPI_Cancel( &(package->request) ); - package->completed = false; - package->served = false; - package->request = MPI_REQUEST_NULL; - cpDst->map[f]->r_con.rcv[i].recycleQueue.enqueue(package); - } - } - - } - - cpDst = cpDst->next; - } - - -#if 1 - CopyMap* cpSrc = sCopyMapHead; - while(cpSrc != 0) - { - for(int f=0; fmap.size(); f++) - { - for(int i=0; imap[f]->r_con.nsnd; i++) - { - while(cpSrc->map[f]->r_con.snd[i].pQueue.queueSize() >= 1) - { - - package = cpSrc->map[f]->r_con.snd[i].pQueue.dequeue(); - /* - int ns = cpSrc->map[f]->r_con.snd[i].ns; - int nd = cpSrc->map[f]->r_con.snd[i].nd; - int r_gid = cpSrc->map[f]->r_con.snd[i].r_gid; - int r_grids = cpSrc->map[f]->r_con.snd[i].r_grids; - //int tag = tagGen(ns, nd, r_gid-1, np*r_grids, nGraphs); - int tag = Perilla::myTagMap[r_gid][nd][ns][cpSrc->map[f]->r_con.snd[i].sz]; - - Package* sPackage = lMap[f]->r_con.snd[i].pQueue.getFront(true); - package->request = ParallelDescriptor::Asend(sPackage->databuf, - cpSrc->map[f]->r_con.snd[i].sz, - cpSrc->map[f]->r_con.snd[i].pr, tag).req(); // tag == SeqNum in c++ ver - - */ - MPI_Wait( &(package->request), &status ); - package->completed = false; - package->served = false; - package->request = MPI_REQUEST_NULL; - cpSrc->map[f]->r_con.snd[i].recycleQueue.enqueue(package); - } - } - } - cpSrc = cpSrc->next; - } -#endif - } - -#endif - -//ndefupcxx -#endif - - //if(WorkerThread::isTeamMasterThread(tid)) commented out b/c its already call by single thread in a team - //Perilla::globalBarrier->sync(perilla::NUM_THREAD_TEAMS); - -#if 0 - // Parallel Copy Reset on Local tg - for(int f=0; f 0) - { - lMap[f]->r_con.firingRuleCnt = 0; - - for(int i=0; ir_con.nsnd; i++) - while(lMap[f]->r_con.snd[i].pQueue.queueSize() >= 1) - { - package = lMap[f]->r_con.snd[i].pQueue.dequeue(); - package->completed = false; - package->served = false; - package->request = MPI_REQUEST_NULL; - lMap[f]->r_con.snd[i].recycleQueue.enqueue(package); - } - - for(int i=0; ir_con.nrcv; i++) - while(lMap[f]->r_con.rcv[i].pQueue.queueSize() >= 1) - { - package = lMap[f]->r_con.rcv[i].pQueue.dequeue(); - package->completed = false; - package->served = false; - package->request = MPI_REQUEST_NULL; - lMap[f]->r_con.rcv[i].recycleQueue.enqueue(package); - } - } - } - } - - // Fill boundary reset on local tg - if(tg == 0) - { - for(int f=0; f 0) - { - // if(WorkerThread::isMyRegion(tg,f)) - { - for(int i=0; i< rMap[f]->r_con.nrcv; i++) - while( rMap[f]->r_con.rcv[i].pQueue.queueSize() >= 1) - { - package = rMap[f]->r_con.rcv[i].pQueue.dequeue(); - if(package->request != MPI_REQUEST_NULL) - MPI_Cancel( &(package->request) ); -{ -printf("Canceling a message\n"); -} - package->completed = false; - package->served = false; - package->request = MPI_REQUEST_NULL; - rMap[f]->r_con.rcv[i].recycleQueue.enqueue(package); - } - for(int i=0; i< sMap[f]->r_con.nsnd; i++) - while( sMap[f]->r_con.snd[i].pQueue.queueSize() >= 1) - { - package = sMap[f]->r_con.snd[i].pQueue.dequeue(); - MPI_Wait( &(package->request), &status ); - package->completed = false; - package->served = 
false; - package->request = MPI_REQUEST_NULL; - sMap[f]->r_con.snd[i].recycleQueue.enqueue(package); - } - } - } - } -#endif -#endif -} - -void RegionGraph::workerTeardown() -{ - int numfabs = numTasks; - Package* package; - - regionGraphMinReset(); -} - -RegionGraph::~RegionGraph() -{ - delete[] okToReset; - for(int tg=0; tg -#include - -//////////////////////// class RegionQueue Declaration Start ///////////////////////////////////// -class RegionQueue -{ -private: - int* buffer; - int n; - int front; - int rear; - int max_size; - pthread_mutex_t queueLock; -public: - RegionQueue(); - RegionQueue(int numTasks); - ~RegionQueue(); - void addRegion(int r); - void addRegion(int r, bool canAvoidLock); - int removeRegion(); - int removeRegion(bool canAvoidLock); - int getFrontRegion(); - int getFrontRegion(bool canAvoidLock); - int queueSize(bool canAvoidLock); - int queueSize(); - void reallocate(); -}; -//////////////////////// class RegionQueue Declaration End ///////////////////////////////////// - -#endif diff --git a/Src/AmrTask/rts_impls/runtime_common/RegionQueue.cpp b/Src/AmrTask/rts_impls/runtime_common/RegionQueue.cpp deleted file mode 100755 index 894e116a120..00000000000 --- a/Src/AmrTask/rts_impls/runtime_common/RegionQueue.cpp +++ /dev/null @@ -1,102 +0,0 @@ -#include -#include -#include -#include - -//////////////////////// class RegionQueue Definition Start ///////////////////////////////////// -RegionQueue::RegionQueue(void) -{ - max_size= perilla::TASK_QUEUE_DEFAULT_SIZE; - buffer = new int[max_size]; - n = 0; - front = 0; - rear = 0; - queueLock=PTHREAD_MUTEX_INITIALIZER; -} - -RegionQueue::RegionQueue(int numTasks) -{ - buffer = new int[numTasks]; - n = 0; - max_size = numTasks; - front = 0; - rear = 0; - queueLock=PTHREAD_MUTEX_INITIALIZER; -} - -RegionQueue::~RegionQueue() -{ - delete[] buffer; -} - - -void RegionQueue::addRegion(int r) -{ - pthread_mutex_lock(&queueLock); - buffer[rear] = r; - rear = (rear+1)%max_size; - n++; - pthread_mutex_unlock(&queueLock); -} - -void RegionQueue::addRegion(int r, bool canAvoidLock) -{ - if(!canAvoidLock)pthread_mutex_lock(&queueLock); - buffer[rear] = r; - rear = (rear+1)%max_size; - n++; - if(!canAvoidLock)pthread_mutex_unlock(&queueLock); -} - -int RegionQueue::removeRegion() -{ - int r; - pthread_mutex_lock(&queueLock); - r = buffer[front]; - front = (front+1)%max_size; - n--; - pthread_mutex_unlock(&queueLock); - return r; -} - -int RegionQueue::removeRegion(bool canAvoidLock) -{ - int r; - if(!canAvoidLock)pthread_mutex_lock(&queueLock); - r = buffer[front]; - front = (front+1)%max_size; - n--; - if(!canAvoidLock)pthread_mutex_unlock(&queueLock); - return r; -} - -int RegionQueue::getFrontRegion() -{ - return buffer[front]; -} - -int RegionQueue::getFrontRegion(bool canAvoidLock) -{ - int r; - if(!canAvoidLock)pthread_mutex_lock(&queueLock); - r = buffer[front]; - if(!canAvoidLock)pthread_mutex_unlock(&queueLock); - return r; -} - -int RegionQueue::queueSize() -{ - int size; - pthread_mutex_lock(&queueLock); - size = n; - pthread_mutex_unlock(&queueLock); - return size; -} - -int RegionQueue::queueSize(bool canAvoidLock) -{ - int size; - if(!canAvoidLock)pthread_mutex_lock(&queueLock); - size = n; - if(!canAvoidLock)pthread_mutex_unlock(&queueLock); - return size; -} -//////////////////////// class RegionQueue Definition End ///////////////////////////////////// diff --git a/Src/AmrTask/rts_impls/runtime_common/RemoteConnection.H b/Src/AmrTask/rts_impls/runtime_common/RemoteConnection.H deleted file mode 100755 index
23bc16e97f8..00000000000 --- a/Src/AmrTask/rts_impls/runtime_common/RemoteConnection.H +++ /dev/null @@ -1,93 +0,0 @@ -#ifndef P_REMOTECONNECTION_H -#define P_REMOTECONNECTION_H - -#include -#include -#include - -using namespace perilla; -#ifdef PERILLA_DEBUG -#include "PerillaMemCheck.H" -extern PerillaMemCheck memcheck; -#endif - - -class RemoteCommDescriptor -{ -public: - int ns, lns; // ! Source box in layout - int nd, lnd; //! Destination box in layout - int r_gid; - int r_grids; - int sz, pr; - Box sbx; // ! Sub-box for this copy - Box dbx; // ! Sub-box for this copy - PackageQueue pQueue; // !store incoming or outgoing messages, both fab and the runtime can access this queue - PackageQueue recycleQueue; //!store used messages, only fab can access this queue, no lock is required - int cnt; - RemoteCommDescriptor() : - ns(-1), lns(-1), - nd(-1), lnd(-1), - sz(0), pr(0), - cnt(0), r_gid(0), - r_grids(0) - { -#ifdef PERILLA_DEBUG - memcheck.add(memcheck.genKey(this), (void*)this, "RemoteCommDescriptor"); -#endif - } - - ~RemoteCommDescriptor(){ -#ifdef PERILLA_DEBUG - memcheck.remove(memcheck.genKey(this)); -#endif - } -}; - -class TransDescriptor -{ - int sz, pv, pr; -}; - -class RemoteConnection -{ -public: - int nsnd; - int nrcv; - bool remotePushReady; - bool remotePullDone; - int nrp, nsp; - pthread_mutex_t sndLock, rcvLock, ghostLock; - int firingRuleCnt; - RemoteCommDescriptor *snd; - RemoteCommDescriptor *rcv; - TransDescriptor *str; - TransDescriptor *rtr; - RemoteConnection() : - nsnd(0), - nrcv(0), - remotePushReady(false), - remotePullDone(false), - nrp(0), nsp(0), - firingRuleCnt(0), - snd(NULL), rcv(NULL), - str(NULL), rtr(NULL), - sndLock(PTHREAD_MUTEX_INITIALIZER), - rcvLock(PTHREAD_MUTEX_INITIALIZER), - ghostLock(PTHREAD_MUTEX_INITIALIZER) - { -// memcheck.add(memcheck.genKey(this), (void*)this, "RemoteCommDescriptor"); - } - - ~RemoteConnection() - { - if(snd) - delete[] snd; - if(rcv) - delete[] rcv; -// memcheck.remove(memcheck.genKey(this)); - } -}; - - -#endif diff --git a/Src/AmrTask/rts_impls/runtime_common/WorkerThread.H b/Src/AmrTask/rts_impls/runtime_common/WorkerThread.H deleted file mode 100755 index 7c20c796d4c..00000000000 --- a/Src/AmrTask/rts_impls/runtime_common/WorkerThread.H +++ /dev/null @@ -1,75 +0,0 @@ -#ifndef P_WORKERTHREAD_H -#define P_WORKERTHREAD_H -#include -#include -#include - -namespace perilla{ - - class WorkerThread - { - //static void* team_shared_memory[perilla::NUM_THREAD_TEAMS]; - int tid; - public: - static void init(); - static Barrier* globalBarrier; - static Barrier* localBarriers[perilla::NUM_THREAD_TEAMS]; - static Barrier* localBarriers1[perilla::NUM_THREAD_TEAMS]; - static int perilla_tid(); - static int perilla_wtid(); - static int perilla_wid(); - static int perilla_nWorkerThreads(); - static int perilla_nWorkers(); - static int perilla_nTeamThreads(); - static bool perilla_isMasterWorkerThread(); - static bool perilla_isMasterThread(); - static bool perilla_isCommunicationThread(); - static bool isMyRegion(int workerID, int regionID); - static void setTeamSharedMemory(void* dummy, int tid, int tg); - static void* getTeamSharedMemory(int tg); - static void syncWorkers(); - static void syncWorkers(int tid); - static void syncThreads(); - static void syncComputeThreads(); - static void syncAllComputeThreads(); - static void syncTeamThreads(); - static void syncAllThreads(); - static void syncWorkerThreads(); - static void syncWorkerThreads(int numthreads); - static void syncComputeWorkerThreads(); - static void 
syncComputeWorkerThreads(int numthreads); - }; - - static int tid(){return WorkerThread::perilla_tid();} - static int wtid(){return WorkerThread::perilla_wtid();} - static int wid(){return WorkerThread::perilla_wid();} - static int nWorkerThreads(){return WorkerThread::perilla_nWorkerThreads();} - static int nWorkers(){return WorkerThread::perilla_nWorkers();} - static int nThreads(){return perilla::NUM_THREAD_TEAMS*perilla::NUM_THREADS_PER_TEAM;} - static bool isMasterWorkerThread(){return WorkerThread::perilla_isMasterWorkerThread();} - static bool isMasterThread(){return WorkerThread::perilla_isMasterThread();} - static bool isCommunicationThread(){return WorkerThread::perilla_isCommunicationThread();} - static bool isMyRegion(int workerID, int regionID){return WorkerThread::isMyRegion(workerID, regionID);} - //static void setTeamSharedMemory(void* dummy, int tid, int tg){WorkerThread::setTeamSharedMemory(dummy, tid, tg);} - //static void* getTeamSharedMemory(int tg){WorkerThread::getTeamSharedMemory(tg);} - static void syncWorkers(){WorkerThread::syncWorkers();} - static void syncWorkers(int tid){WorkerThread::syncWorkers(tid);} - static void syncThreads(){WorkerThread::syncThreads();} - static void syncComputeThreads(){WorkerThread::syncComputeThreads();} - static void syncAllComputeThreads(){WorkerThread::syncAllComputeThreads();} - static void syncComputeWorkerThreads(){WorkerThread::syncComputeWorkerThreads();} - static void syncComputeWorkerThreads(int numthreads){WorkerThread::syncComputeWorkerThreads(numthreads);} - static void syncWorkerThreads(){WorkerThread::syncWorkerThreads();} - static void syncWorkerThreads(int numthreads){WorkerThread::syncWorkerThreads(numthreads);} - static void syncAllThreads() - { - WorkerThread::syncAllThreads(); - } - static void syncAllWorkerThreads() - { - WorkerThread::syncWorkerThreads(); - WorkerThread::syncWorkers(); - } -}//end namespace - -#endif diff --git a/Src/AmrTask/rts_impls/runtime_common/WorkerThread.cpp b/Src/AmrTask/rts_impls/runtime_common/WorkerThread.cpp deleted file mode 100755 index db7aa169441..00000000000 --- a/Src/AmrTask/rts_impls/runtime_common/WorkerThread.cpp +++ /dev/null @@ -1,141 +0,0 @@ -#include -#include -#include -#include - -using namespace perilla; -//namespace perilla -//{ - //void* WorkerThread::team_shared_memory[perilla::NUM_THREAD_TEAMS]; - Barrier* WorkerThread::globalBarrier; - Barrier* WorkerThread::localBarriers[perilla::NUM_THREAD_TEAMS]; - Barrier* WorkerThread::localBarriers1[perilla::NUM_THREAD_TEAMS]; - - void WorkerThread::init(){ - WorkerThread::globalBarrier= new Barrier(perilla::NUM_THREAD_TEAMS); - for(int i=0; i<perilla::NUM_THREAD_TEAMS; i++){ - localBarriers[i]= new Barrier(perilla::NUM_THREADS_PER_TEAM); - localBarriers1[i]= new Barrier(perilla::NUM_THREADS_PER_TEAM-1); - } - } - - void WorkerThread::syncWorkers(){ - WorkerThread::globalBarrier->sync(perilla::NUM_THREAD_TEAMS); - } - - void WorkerThread::syncWorkers(int tid){ - if(perilla_wid()==tid) WorkerThread::globalBarrier->sync(perilla::NUM_THREAD_TEAMS); - } - - void WorkerThread::syncTeamThreads(){ - WorkerThread::localBarriers[perilla_wid()]->sync(perilla::NUM_THREADS_PER_TEAM); - } - - void WorkerThread::syncWorkerThreads(){ - WorkerThread::localBarriers1[perilla_wid()]->sync(perilla::NUM_THREADS_PER_TEAM-1); - } - void WorkerThread::syncWorkerThreads(int numthreads){ - assert(numthreads== perilla::NUM_THREADS_PER_TEAM-1); - WorkerThread::localBarriers1[perilla_wid()]->sync(numthreads); - } - - -#if defined(USE_PERILLA_OMP) || defined(USE_PERILLA_ON_DEMAND) - void WorkerThread::syncAllThreads(){ - #pragma omp barrier - } -#else - void WorkerThread::syncAllThreads(){ - syncTeamThreads(); - syncWorkers(); - } -#endif
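// The sync(n) calls above and below rely on a counting barrier. A hedged, self-contained
// sketch of that pattern, assuming pthreads; BarrierSketch is illustrative, not the
// Perilla Barrier class itself.
#include <pthread.h>

class BarrierSketch {
    pthread_mutex_t m = PTHREAD_MUTEX_INITIALIZER;
    pthread_cond_t cv = PTHREAD_COND_INITIALIZER;
    int count = 0, generation = 0;
public:
    // Block until n threads have arrived, then release them all; the generation
    // counter lets the barrier be reused immediately for the next sync round.
    void sync(int n) {
        pthread_mutex_lock(&m);
        int gen = generation;
        if (++count == n) { count = 0; ++generation; pthread_cond_broadcast(&cv); }
        else while (gen == generation) pthread_cond_wait(&cv, &m);
        pthread_mutex_unlock(&m);
    }
};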
 void WorkerThread::syncAllComputeThreads(){ - syncComputeWorkerThreads(); - syncWorkers(); - } - - void WorkerThread::syncThreads(){ - syncWorkerThreads(); - syncWorkers(); - } - - void WorkerThread::syncComputeWorkerThreads(){ - WorkerThread::localBarriers1[perilla_wid()]->sync(perilla::NUM_THREADS_PER_TEAM-1); - } - - void WorkerThread::syncComputeWorkerThreads(int numthreads){ - assert(numthreads== perilla::NUM_THREADS_PER_TEAM-1); - WorkerThread::localBarriers1[perilla_wid()]->sync(numthreads); - } - -#if defined(USE_PERILLA_OMP) || defined(USE_PERILLA_ON_DEMAND) - int WorkerThread::perilla_tid(){ - return omp_get_thread_num(); - } -#else - int WorkerThread::perilla_tid(){ - return Perilla::tid(); - } -#endif - - int WorkerThread::perilla_nTeamThreads(){ - return perilla::NUM_THREADS_PER_TEAM; - } - - int WorkerThread::perilla_nWorkerThreads(){ - return perilla::NUM_THREADS_PER_TEAM-1; - } - - int WorkerThread::perilla_nWorkers(){ - return perilla::NUM_THREAD_TEAMS; - } - - int WorkerThread::perilla_wtid() - { - int tid= perilla_tid(); - return (tid % perilla::NUM_THREADS_PER_TEAM) -1; - } - - int WorkerThread::perilla_wid() - { - int tid= perilla_tid(); - return tid / perilla::NUM_THREADS_PER_TEAM; - } - - bool WorkerThread::perilla_isMasterWorkerThread() - { - int tid= perilla_tid(); - if((tid % perilla::NUM_THREADS_PER_TEAM)==1) - return true; - else - return false; - } - - bool WorkerThread::perilla_isMasterThread(){ //pick the first one among master worker threads - return perilla_tid()==1; - } - - bool WorkerThread::perilla_isCommunicationThread() - { - int tid= perilla_tid(); - return (tid % perilla::NUM_THREADS_PER_TEAM)==0 ; - } - - bool WorkerThread::isMyRegion(int workerID, int regionID) - { - return ((regionID) % perilla::NUM_THREAD_TEAMS)==workerID; - } - -#if 0 - void WorkerThread::setTeamSharedMemory(void* dummy, int tid, int tg) - { - if((tid % perilla::NUM_THREADS_PER_TEAM)==1) - team_shared_memory[tg] = dummy; - } - - void* WorkerThread::getTeamSharedMemory(int tg) - { - return team_shared_memory[tg]; - } -#endif -//}//end namespace diff --git a/Src/AmrTask/rts_impls/runtime_common/mylock.h b/Src/AmrTask/rts_impls/runtime_common/mylock.h deleted file mode 100644 index bddb8ed6970..00000000000 --- a/Src/AmrTask/rts_impls/runtime_common/mylock.h +++ /dev/null @@ -1,27 +0,0 @@ -#ifndef MYLOCK -#define MYLOCK - -#include <pthread.h> - -class MyLock -{ - private: - pthread_mutex_t _lock; - - public: - MyLock(){ - pthread_mutex_init(&_lock, NULL); - } - ~MyLock(){ - pthread_mutex_destroy(&_lock); - } - void lock() - { - pthread_mutex_lock(&_lock); - } - void unlock() - { - pthread_mutex_unlock(&_lock); - } -}; -#endif diff --git a/Src/AmrTask/rts_impls/runtime_common/perilla.mak b/Src/AmrTask/rts_impls/runtime_common/perilla.mak deleted file mode 100755 index 073260631ff..00000000000 --- a/Src/AmrTask/rts_impls/runtime_common/perilla.mak +++ /dev/null @@ -1,25 +0,0 @@ -CEXE_sources += Barrier.cpp -CEXE_sources += RGIter.cpp -CEXE_sources += RegionQueue.cpp -CEXE_sources += RegionGraph.cpp -CEXE_sources += WorkerThread.cpp -CEXE_sources += AsyncMultiFabUtil.cpp -CEXE_sources += PerillaMemCheck.cpp -CEXE_sources += Perilla_common.cpp - - -CEXE_headers += Barrier.H -CEXE_headers += Config.H -CEXE_headers += LocalConnection.H -CEXE_headers += PackageQueue.H -CEXE_headers += RegionGraph.H -CEXE_headers += RegionQueue.H -CEXE_headers += RegionGraph.H -CEXE_headers += RemoteConnection.H -CEXE_headers += WorkerThread.H -CEXE_headers += AsyncMultiFabUtil.H -CEXE_headers += PerillaMemCheck.H -CEXE_headers += Perilla.H - - -
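// MyLock above exposes bare lock()/unlock(); a small RAII guard sketch that pairs them
// automatically, assuming mylock.h is included; ScopedLock is hypothetical and was not
// part of the deleted header.
class ScopedLock {
    MyLock& l;
public:
    explicit ScopedLock(MyLock& lk) : l(lk) { l.lock(); }
    ~ScopedLock() { l.unlock(); }                 // released on every exit path
    ScopedLock(const ScopedLock&) = delete;
    ScopedLock& operator=(const ScopedLock&) = delete;
};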
diff --git a/Src/AmrTask/rts_impls/upcxx/Make.package b/Src/AmrTask/rts_impls/upcxx/Make.package deleted file mode 100644 index 6490fb8ef78..00000000000 --- a/Src/AmrTask/rts_impls/upcxx/Make.package +++ /dev/null @@ -1,13 +0,0 @@ -PERILLA_LIB=EXE - -COMMON_DIR=$(AMREX_HOME)/Src/AmrTask/rts_impls/runtime_common - -C$(PERILLA_LIB)_sources += PackageQueue.cpp Perilla.cpp PerillaRts.cpp - -C$(PERILLA_LIB)_headers += $(COMMON_DIR)/Barrier.H Config.H $(COMMON_DIR)/LocalConnection.H PackageQueue.H $(COMMON_DIR)/RegionGraph.H $(COMMON_DIR)/RGIter.H $(COMMON_DIR)/RegionQueue.H $(COMMON_DIR)/RemoteConnection.H $(COMMON_DIR)/WorkerThread.H $(COMMON_DIR)/AsyncMultiFabUtil.H PerillaRts.H - -VPATH_LOCATIONS += $(AMREX_HOME)/Src/AmrTask/rts_impls/runtime_common -INCLUDE_LOCATIONS += $(AMREX_HOME)/Src/AmrTask/rts_impls/runtime_common -VPATH_LOCATIONS += $(AMREX_HOME)/Src/AmrTask/rts_impls/upcxx -INCLUDE_LOCATIONS += $(AMREX_HOME)/Src/AmrTask/rts_impls/upcxx - diff --git a/Src/AmrTask/rts_impls/upcxx/PackageQueue.H b/Src/AmrTask/rts_impls/upcxx/PackageQueue.H deleted file mode 100755 index 9bcadc11d9a..00000000000 --- a/Src/AmrTask/rts_impls/upcxx/PackageQueue.H +++ /dev/null @@ -1,59 +0,0 @@ -#ifndef P_PACKAGEQUEUE_H -#define P_PACKAGEQUEUE_H - -#include -#include -#include -typedef upcxx::future<> CommRequest; - -class Package -{ -private: - int source, destination; -public: - upcxx::global_ptr<double> databuf; - pthread_mutex_t packageLock; - volatile int bufSize; - volatile bool completed; //message transfer is done - volatile bool served; //message transfer request has been served but may have not completed - CommRequest *request; //!for inter-process communication - int tag; - Package(); - ~Package(); - Package(int size); - Package(int src, int dest); - Package(int src, int dest, int size); - void setPackageSource(int src); - void setPackageDestination(int dest); - void completeRequest(void); - void completeRequest(bool canAvoidLock); - bool checkRequest(void); - void generatePackage(int size); -}; - -class PackageQueue -{ -private: - Package *buffer[perilla::MSG_QUEUE_DEFAULT_MAXSIZE]; - volatile int n; - volatile int front; - volatile int rear; - volatile int prear; - int max_size; -public: - pthread_mutex_t queueLock; - PackageQueue(); - ~PackageQueue(); - int queueSize(void); - int queueSize(bool canAvoidLock); - void enqueue(Package* package); - void enqueue(Package* package, bool canAvoidLock); - Package* dequeue(void); - Package* dequeue(bool canAvoidLock); - Package* getRear(void); - Package* getRear(bool canAvoidLock); - Package* getFront(void); - Package* getFront(bool canAvoidLock); - void emptyQueue(bool canAvoidLock); -}; -#endif diff --git a/Src/AmrTask/rts_impls/upcxx/PackageQueue.cpp b/Src/AmrTask/rts_impls/upcxx/PackageQueue.cpp deleted file mode 100755 index ac34408b0d5..00000000000 --- a/Src/AmrTask/rts_impls/upcxx/PackageQueue.cpp +++ /dev/null @@ -1,274 +0,0 @@ -#include -#include - -#ifdef PERILLA_DEBUG -#include -using namespace perilla; -extern PerillaMemCheck memcheck; -#endif - -Package::Package() -{ - databuf = nullptr; - bufSize = 0; - source = 0; - destination = 0; - completed = false; - served = false; - request = 0; - tag=0; - packageLock= PTHREAD_MUTEX_INITIALIZER; -#ifdef PERILLA_DEBUG - memcheck.add(memcheck.genKey(this), (void*)this, "Package"); -#endif -} - -Package::~Package() -{ - if(databuf != nullptr) - if(databuf.is_local()) - { - upcxx::delete_array(databuf); - } -#ifdef PERILLA_DEBUG - memcheck.remove(memcheck.genKey(this)); -#endif -}
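// Buffer life cycle implied by Package above: allocate from the UPC++ shared heap and
// free only if the calling rank owns the memory. A standalone sketch, assuming a
// UPC++ 2019.x installation; it is not the Perilla class itself.
#include <upcxx/upcxx.hpp>

int main() {
    upcxx::init();
    upcxx::global_ptr<double> buf = upcxx::new_array<double>(16); // shared-segment allocation
    if (buf.is_local())                                           // mirrors the ~Package() guard
        upcxx::delete_array(buf);
    upcxx::finalize();
    return 0;
}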
-Package::Package(int size) -{ - databuf = (upcxx::global_ptr<double>)upcxx::new_array<double>(size); - bufSize = size; - source = 0; - destination = 0; - completed = false; - served = false; - request = 0; - tag=0; - packageLock= PTHREAD_MUTEX_INITIALIZER; -#ifdef PERILLA_DEBUG - memcheck.add(memcheck.genKey(this), (void*)this, "Package"); -#endif -} - -Package::Package(int src, int dest) -{ - databuf= nullptr; - bufSize = 0; - source = src; - destination = dest; - completed = false; - served = false; - request = 0; - tag=0; - packageLock= PTHREAD_MUTEX_INITIALIZER; -#ifdef PERILLA_DEBUG - memcheck.add(memcheck.genKey(this), (void*)this, "Package"); -#endif -} - -Package::Package(int src, int dest, int size) -{ - databuf = (upcxx::global_ptr<double>)upcxx::new_array<double>(size); - bufSize = size; - source = src; - destination = dest; - completed = false; - served = false; - request = 0; - tag=0; - packageLock= PTHREAD_MUTEX_INITIALIZER; -#ifdef PERILLA_DEBUG - memcheck.add(memcheck.genKey(this), (void*)this, "Package"); -#endif -} - -void Package::setPackageSource(int src) -{ - source = src; -} - -void Package::setPackageDestination(int dest) -{ - destination = dest; -} - -void Package::completeRequest(void) -{ - pthread_mutex_lock(&packageLock); - completed = true; - pthread_mutex_unlock(&packageLock); -} - -void Package::completeRequest(bool canAvoidLock) -{ - if(!canAvoidLock)pthread_mutex_lock(&packageLock); - completed = true; - if(!canAvoidLock)pthread_mutex_unlock(&packageLock); -} - -bool Package::checkRequest(void) -{ - return completed; -} - -void Package::generatePackage(int size) -{ - databuf = (upcxx::global_ptr<double>)upcxx::new_array<double>(size); - bufSize = size; - source = 0; - destination = 0; - completed = false; - served = false; - request = 0; - tag=0; - packageLock= PTHREAD_MUTEX_INITIALIZER; -#ifdef PERILLA_DEBUG - memcheck.add(memcheck.genKey(this), (void*)this, "Package"); -#endif -} - -PackageQueue::PackageQueue() -{ - n = 0; - front = 0; - rear = 0; - prear = -1; - max_size=perilla::MSG_QUEUE_DEFAULT_MAXSIZE; - queueLock= PTHREAD_MUTEX_INITIALIZER; -} - -int PackageQueue::queueSize(void) -{ - int size; - pthread_mutex_lock(&queueLock); - size = n; - pthread_mutex_unlock(&queueLock); - return size; -} - -int PackageQueue::queueSize(bool canAvoidLock) -{ - int size; - if(!canAvoidLock)pthread_mutex_lock(&queueLock); - size = n; - if(!canAvoidLock)pthread_mutex_unlock(&queueLock); - return size; -} - -void PackageQueue::enqueue(Package* package) -{ - pthread_mutex_lock(&queueLock); -#ifdef PERILLA_DEBUG - if(n==perilla::MSG_QUEUE_DEFAULT_MAXSIZE){ - printf("Failed to Enqueue: Queue Overflow\n"); - exit(0); - } -#endif - buffer[rear] = package; - prear = rear; - rear = (rear+1)%perilla::MSG_QUEUE_DEFAULT_MAXSIZE; - n++; - pthread_mutex_unlock(&queueLock); -} - -void PackageQueue::enqueue(Package* package, bool canAvoidLock) -{ - if(!canAvoidLock)pthread_mutex_lock(&queueLock); -#ifdef PERILLA_DEBUG - if(n==perilla::MSG_QUEUE_DEFAULT_MAXSIZE){ - printf("Failed to Enqueue: Queue Overflow\n"); - exit(0); - } -#endif - buffer[rear] = package; - prear = rear; - rear = (rear+1)%perilla::MSG_QUEUE_DEFAULT_MAXSIZE; - n++; - if(!canAvoidLock)pthread_mutex_unlock(&queueLock); -} - -Package* PackageQueue::dequeue(void) -{ - Package* package = 0; - pthread_mutex_lock(&queueLock); -#ifdef PERILLA_DEBUG - if(n<0){ - printf("Failed to Dequeue: Queue Empty\n"); - exit(0); - } -#endif - package = buffer[front]; - front = (front+1)%perilla::MSG_QUEUE_DEFAULT_MAXSIZE; - n--; - pthread_mutex_unlock(&queueLock); - return package; -}
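// The canAvoidLock flag in the queue methods lets a caller that already holds the
// public queueLock skip the internal locking. A hedged usage sketch, assuming
// PackageQueue.H above is included; drain() is a hypothetical helper:
#include <pthread.h>

void drain(PackageQueue& q) {
    pthread_mutex_lock(&q.queueLock);   // take the lock once for the whole batch
    while (q.queueSize(true) > 0)       // true == caller already holds the lock
        delete q.dequeue(true);
    pthread_mutex_unlock(&q.queueLock);
}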
-Package* PackageQueue::dequeue(bool canAvoidLock) -{ - Package* package = 0; - if(!canAvoidLock)pthread_mutex_lock(&queueLock); -#ifdef PERILLA_DEBUG - if(n<0){ - printf("Failed to Dequeue: Queue Empty\n"); - exit(0); - } -#endif - package = buffer[front]; - front = (front+1)%perilla::MSG_QUEUE_DEFAULT_MAXSIZE; - n--; - if(!canAvoidLock)pthread_mutex_unlock(&queueLock); - return package; -} - -Package* PackageQueue::getRear(void) -{ - Package* package = 0; - pthread_mutex_lock(&queueLock); - if(n) package = buffer[prear]; - pthread_mutex_unlock(&queueLock); - return package; -} - -Package* PackageQueue::getRear(bool canAvoidLock) -{ - Package* package = 0; - if(!canAvoidLock)pthread_mutex_lock(&queueLock); - if(n) package = buffer[prear]; - if(!canAvoidLock)pthread_mutex_unlock(&queueLock); - return package; -} - -Package* PackageQueue::getFront(void) -{ - Package* package = 0; - pthread_mutex_lock(&queueLock); - if(n) package = buffer[front]; - pthread_mutex_unlock(&queueLock); - return package; -} - -Package* PackageQueue::getFront(bool canAvoidLock) -{ - Package* package = 0; - if(!canAvoidLock) pthread_mutex_lock(&queueLock); - if(n) package = buffer[front]; - if(!canAvoidLock) pthread_mutex_unlock(&queueLock); - return package; -} - -void PackageQueue::emptyQueue(bool canAvoidLock){ - if(!canAvoidLock) pthread_mutex_lock(&queueLock); - while(n){ - Package* p= dequeue(true); - delete p; - } - if(!canAvoidLock) pthread_mutex_unlock(&queueLock); -} - -PackageQueue::~PackageQueue() -{ - emptyQueue(true); -} - diff --git a/Src/AmrTask/rts_impls/upcxx/Perilla.H b/Src/AmrTask/rts_impls/upcxx/Perilla.H deleted file mode 100755 index f4f17c59b51..00000000000 --- a/Src/AmrTask/rts_impls/upcxx/Perilla.H +++ /dev/null @@ -1,78 +0,0 @@ -#ifndef _PERILLA_ -#define _PERILLA_ - -#include -#include -#include -#include -#include - -#include - -//#define USE_PERILLA_PTHREADS - -using namespace std; - -namespace amrex{ - class Perilla - { - static int tagGen(int src, int dest, int channelID, int nFabs, int nChannels); - - public: - static int uTags; - static bool genTags; - static int max_step; - - static std::map<int, std::map<int,int>> pTagCnt; - static std::map<int, std::map<int, std::map<int, std::map<int, std::map<int,int>>>>> tagMap; - static std::map<int, std::map<int, std::map<int, std::map<int,int>>>> myTagMap; - static void clearTagMap(); - static void clearMyTagMap(); - static void communicateTags(); - static void registerId(int tid); - static int tid(); - static volatile int numTeamsFinished; - static volatile int updateMetadata_request; - static volatile int updateMetadata_noticed; - static volatile int updateMetadata_done; - static Barrier * globalBarrier; - static void syncProcesses(); - static void multifabBuildFabCon(RegionGraph* graph, const MultiFab& mf, const Periodicity& period); - static void serviceLocalRequests(RegionGraph *graph, int tg); - static void serviceRemoteRequests(RegionGraph *graph, int graphID, int nGraphs); - static void serviceRemoteRequests(RegionGraph *graph); - //static void serviceSingleGraphComm(RegionGraph* graph, int tid); - //static void serviceMultipleGraphComm(RegionGraph graphArray[], int nGraphs, bool cpyAcross, int tid); - static void serviceMultipleGraphCommDynamic(std::vector<RegionGraph*> graphArray, bool cpyAcross, int tid); - static void flattenGraphHierarchy(std::vector<std::vector<RegionGraph*> >graphArray, std::vector<RegionGraph*> &flattenedGraphArray); - //static void serviceMultipleGraphComm(RegionGraph graphArray[], int nGraphs, int tid); - static void fillBoundaryPush(RegionGraph* graph, MultiFab* mf, int f); - static void fillBoundaryPull(RegionGraph* graph, MultiFab* mf, int f, bool singleT); - - void multifabExtractCopyAssoc(void* threadInfo); - static void multifabExtractCopyAssoc(RegionGraph* gDst, RegionGraph* gSrc, const MultiFab& dmf, const MultiFab& smf, int nc, int ng, int ngSrc, const Periodicity& period); - static void multifabExtractCopyAssoc(RegionGraph* gDst, RegionGraph* gSrc, const MultiFab& dmf, const MultiFab& smf, const Periodicity& period); - static void multifabCopyPushAsync(RegionGraph* destGraph, RegionGraph* srcGraph, MultiFab* dmf, MultiFab* smf, int f, int dstcomp, int srccomp, int nc, int ng, int ngsrc, bool singleT); - static void multifabCopyPushAsync(RegionGraph* destGraph, RegionGraph* srcGraph, MultiFab* dmf, MultiFab* smf, int f, bool singleT); - static void multifabCopyPull(RegionGraph* destGraph, RegionGraph* srcGraph, MultiFab* dmf, MultiFab* smf, int f, int dstcomp, int srccomp, int nc, int ng, int ngsrc, bool singleT); - static void multifabCopyPull(RegionGraph* destGraph, RegionGraph* srcGraph, MultiFab* dmf, MultiFab* smf, int f, bool singleT); - static void serviceLocalGridCopyRequests(std::vector<RegionGraph*> graphArray, int g, int tg); - static void serviceRemoteGridCopyRequests(std::vector<RegionGraph*> graphArray, int g, int nGraph, int tg); - static void resetRemoteGridCopyRequests(std::vector<RegionGraph*> graphArray, int g, int nGraph, int tg); - - - - static void multifabCopyPush(RegionGraph* destGraph, RegionGraph* srcGraph, amrex::MultiFab* dmf, amrex::MultiFab* smf, int f, int dstcomp, int srccomp, int nc, int ng, int ngsrc, bool singleT); - static void multifabCopyPush(RegionGraph* destGraph, RegionGraph* srcGraph, amrex::MultiFab* dmf, amrex::MultiFab* smf, int f, bool singleT); - - static void multifabCopyPush_1Team(RegionGraph* destGraph, RegionGraph* srcGraph, amrex::MultiFab* dmf, amrex::MultiFab* smf, int f, int dstcomp, int srccomp, int nc, int ng, int ngsrc, bool singleT); - static void fillBoundaryPull_1Team(RegionGraph *graph, amrex::MultiFab& mf, int f); - - static void fillBoundaryPush(amrex::RGIter& rgi, amrex::MultiFab& mf); - static void fillBoundaryPull(amrex::RGIter& rgi, amrex::MultiFab& mf, bool singleT); - static void fillBoundaryPush(amrex::RGIter& rgi, RegionGraph *graph, amrex::MultiFab& mf); - static void fillBoundaryPull(amrex::RGIter& rgi, RegionGraph *graph, amrex::MultiFab& mf, bool singleT); - - }; // class Perilla -} -#endif
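// Sketch of the nested tag-map lookup reconstructed above, assuming the innermost
// value is an integer message tag addressed as tagMap[pr][graphID][nd][ns][sz];
// TagMap and lookupTag are illustrative names, not the Perilla API.
#include <map>

using TagMap = std::map<int, std::map<int, std::map<int, std::map<int, std::map<int,int>>>>>;

inline int& lookupTag(TagMap& tm, int pr, int gid, int nd, int ns, int sz)
{
    return tm[pr][gid][nd][ns][sz];   // operator[] default-creates the missing levels
}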
diff --git a/Src/AmrTask/rts_impls/upcxx/Perilla.cpp b/Src/AmrTask/rts_impls/upcxx/Perilla.cpp deleted file mode 100755 index 186bbd0a8f9..00000000000 --- a/Src/AmrTask/rts_impls/upcxx/Perilla.cpp +++ /dev/null @@ -1,3036 +0,0 @@ -#include -#include -#include -#include -#include -#include -#include -#include -#include -#include -#include -#include -#include -using namespace std; -using namespace amrex; -using namespace perilla; -using namespace upcxx; - - -struct sMsgMap_t{ - std::map< int, std::map< int, std::list< Package* > > > map; - volatile int size=0; - pthread_mutex_t lock= PTHREAD_MUTEX_INITIALIZER; -}sMsgMap; - -struct rMsgMap_t{ - std::map< int, std::map< int, std::list< Package* > > > map; - volatile int size=0; - pthread_mutex_t lock= PTHREAD_MUTEX_INITIALIZER; -}rMsgMap; - -struct getReq_t{ - int src; - int tag; - upcxx::global_ptr<double> sbuf; - int size; - getReq_t(int _src, int _tag, upcxx::global_ptr<double> _sbuf, int _size):src(_src), tag(_tag), sbuf(_sbuf), size(_size){} -};
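// A hedged sketch of the pull protocol implemented below: the sender publishes a
// global_ptr to its payload via rpc, and the receiver issues a one-sided rget into
// its own buffer; pull_payload is illustrative, assuming UPC++.
#include <upcxx/upcxx.hpp>

upcxx::future<> pull_payload(upcxx::global_ptr<double> sbuf, double* localbuf, int n)
{
    // copy n doubles from the sender's shared segment; the runtime below instead keeps
    // the returned future in Package::request and polls it from the communication thread
    return upcxx::rget(sbuf, localbuf, n);
}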
-struct pendingGetList_t{ - std::list< getReq_t* > _pendingGets; - pthread_mutex_t lock= PTHREAD_MUTEX_INITIALIZER; - void add(getReq_t* req){ - pthread_mutex_lock(&lock); - _pendingGets.push_back(req); - pthread_mutex_unlock(&lock); - } - void process(){ - if(_pendingGets.size()==0) return; - pthread_mutex_lock(&(rMsgMap.lock)); - pthread_mutex_lock(&lock); - std::list< getReq_t* >::iterator it= _pendingGets.begin(); - while(it != _pendingGets.end()){ - double* localbuf= NULL; - int src= (*it)->src; - int tag= (*it)->tag; - if(rMsgMap.map.find(src) != rMsgMap.map.end()){ - if(rMsgMap.map[src].find(tag) != rMsgMap.map[src].end()){ - if(rMsgMap.map[src][tag].size() >0){ - rMsgMap.map[src][tag].front()->tag= tag; - localbuf= (rMsgMap.map[src][tag].front()->databuf).local(); //(double*) (static_cast > (rMsgMap.map[src][tag].front()->databuf).local()); - *(rMsgMap.map[src][tag].front()->request)= upcxx::rget((*it)->sbuf, localbuf, (*it)->size); - rMsgMap.map[src][tag].pop_front(); - rMsgMap.size--; - std::list< getReq_t* >::iterator it1= it; - it++; - delete (*it1); - _pendingGets.erase(it1); - }else it++; - }else it++; - }else it++; - } - pthread_mutex_unlock(&lock); - pthread_mutex_unlock(&(rMsgMap.lock)); - } -} pendingGetList; - - -void Perilla::syncProcesses(){ - upcxx::barrier(); -} - - -void Perilla::serviceLocalRequests(RegionGraph* rg, int tg) -{ - int numfabs = rg->lMap.size(); - for(int f=0; f<numfabs; f++) - { - int fg = f % perilla::NUM_THREAD_TEAMS; - if(tg == fg) - { - bool anyReq=false; - for(int i=0; i<rg->lMap[f]->l_con.nscpy; i++) - if(rg->lMap[f]->l_con.scpy[i].pQueue.queueSize(true)>0){ - anyReq=true; - break; - } - if(anyReq) - { - pthread_mutex_lock(&(rg->lMap[f]->l_con.sLock)); - for(int i=0; i<rg->lMap[f]->l_con.nscpy; i++){ - if(rg->lMap[f]->l_con.scpy[i].pQueue.queueSize(true)>0) - { - Package *sPackage = rg->lMap[f]->l_con.scpy[i].pQueue.dequeue(true); - pthread_mutex_lock(&(rg->lMap[rg->lMap[f]->l_con.scpy[i].nd]->l_con.dLock)); - int dPartner = rg->lMap[f]->l_con.scpy[i].dPartner; - Package *dPackage = rg->lMap[rg->lMap[f]->l_con.scpy[i].nd]->l_con.dcpy[dPartner].recycleQueue.dequeue(true); - std::memcpy(dPackage->databuf.local(), sPackage->databuf.local(), dPackage->bufSize * sizeof(double)); - rg->lMap[rg->lMap[f]->l_con.scpy[i].nd]->l_con.dcpy[dPartner].pQueue.enqueue(dPackage,true); - if(rg->lMap[rg->lMap[f]->l_con.scpy[i].nd]->l_con.dcpy[dPartner].pQueue.queueSize(true)==1) - rg->lMap[rg->lMap[f]->l_con.scpy[i].nd]->l_con.firingRuleCnt++; - pthread_mutex_unlock(&(rg->lMap[rg->lMap[f]->l_con.scpy[i].nd]->l_con.dLock)); - rg->lMap[f]->l_con.scpy[i].recycleQueue.enqueue(sPackage,true); - } - } - pthread_mutex_unlock(&(rg->lMap[f]->l_con.sLock)); - } - }// if(tg==fg) - }// for(f<numfabs) -} - -void Perilla::serviceRemoteRequests(RegionGraph* rg, int graphID, int nGraphs) -{ - int numfabs = rg->rMap.size(); - - for(int f=0; f<numfabs; f++) - { - bool nextrReq = false; - //int lockSucceeded = pthread_mutex_trylock(&(rg->rMap[f]->r_con.rcvLock)); - //if(lockSucceeded != 0) - { - //if(pthread_mutex_trylock(&(rg->lMap[f]->r_con.rcvLock)) != 0) - { - for(int i=0; i<rg->lMap[f]->r_con.nrcv; i++) - { - if(rg->rMap[f]->r_con.rcv[i].pQueue.queueSize(true) == 0) //!no message has been received or all received messages have been claimed - nextrReq = true; - else - { - Package *rearPackage = rg->rMap[f]->r_con.rcv[i].pQueue.getRear(true);//!CHECK THIS POINT LATER - if(rearPackage->completed && rg->rMap[f]->r_con.rcv[i].pQueue.queueSize(true) == 1) //!latest receive request has been completed - nextrReq = true; - else //!expected message is still on the way - nextrReq = false; - } - if(nextrReq) //!take a message from recycle pool and post a receive - { - pthread_mutex_lock(&(rg->rMap[f]->r_con.rcvLock)); - pthread_mutex_lock(&(rg->lMap[f]->r_con.rcvLock)); - int ns = rg->rMap[f]->r_con.rcv[i].ns; - int nd = rg->rMap[f]->r_con.rcv[i].nd; - int lnd = rg->rMap[f]->r_con.rcv[i].lnd; - int r_grids = rg->rMap[f]->r_con.rcv[i].r_grids; - //!create a package to keep track of receive requests - Package *rMetaPackage = rg->rMap[f]->r_con.rcv[i].recycleQueue.dequeue(true); - 
//!extract a package from the recycle pool at the destination NUMA node to buffer incoming data - Package *rPackage = rg->lMap[f]->r_con.rcv[i].recycleQueue.dequeue(true); - int tag = tagMap[rg->rMap[f]->r_con.rcv[i].pr][graphID][nd][ns][rg->rMap[f]->r_con.rcv[i].sz]; - - rPackage->request = new future<>; - rPackage->tag = tag; - rg->lMap[f]->r_con.rcv[i].pQueue.enqueue(rPackage,true); //!this is not done yet - rg->rMap[f]->r_con.rcv[i].pQueue.enqueue(rMetaPackage,true); //!this is not done yet - pthread_mutex_lock(&(rMsgMap.lock)); - rMsgMap.map[rg->rMap[f]->r_con.rcv[i].pr][tag].push_back(rPackage); - rMsgMap.size++; - pthread_mutex_unlock(&(rMsgMap.lock)); - pthread_mutex_unlock(&(rg->lMap[f]->r_con.rcvLock)); - pthread_mutex_unlock(&(rg->rMap[f]->r_con.rcvLock)); - } - } - //pthread_mutex_unlock(&(rg->lMap[f]->r_con.rcvLock)); - }// if(omp_test_lock) - //pthread_mutex_unlock(&(rg->rMap[f]->r_con.rcvLock)); - }// if(lockSucceeded) - }// for(fsMap[f]->r_con.nsnd; i++) - { - if(rg->sMap[f]->r_con.snd[i].pQueue.queueSize(true) == 0) //then !no message has been issued or all send requests have been fulfilled - nextsReq = false; - else - nextsReq = true; - if(nextsReq) - { - Package *sMetaPackage = rg->sMap[f]->r_con.snd[i].pQueue.getFront(true); - if(!sMetaPackage->served) - { - Package *sPackage = rg->lMap[f]->r_con.snd[i].pQueue.getFront(true); - sMetaPackage->completed = false; - sMetaPackage->served = true; - int ns = rg->sMap[f]->r_con.snd[i].ns; - int nd = rg->sMap[f]->r_con.snd[i].nd; - int r_gid = rg->sMap[f]->r_con.snd[i].r_gid; - int r_grids = rg->sMap[f]->r_con.snd[i].r_grids; - int tag = Perilla::myTagMap[r_gid][nd][ns][rg->sMap[f]->r_con.snd[i].sz]; - int src= upcxx::rank_me(); - //register send request so that the receiver can send back confirmation upon pull completion - sPackage->completed = false; - pthread_mutex_lock(&(sMsgMap.lock)); - sMsgMap.map[rg->sMap[f]->r_con.snd[i].pr][tag].push_back(sPackage); - sMsgMap.size++; - pthread_mutex_unlock(&(sMsgMap.lock)); - int size= rg->sMap[f]->r_con.snd[i].sz; - upcxx::global_ptr sbuf= sPackage->databuf; //static_cast >((double*)sPackage->databuf); - int dst= rg->sMap[f]->r_con.snd[i].pr; - upcxx::rpc(dst, - [=](){ - //at destination rank, look up recv buffer and pull remote data and store data in the buffer - bool posted_recv=false; - double* localbuf= NULL; - pthread_mutex_lock(&(rMsgMap.lock)); - if(rMsgMap.map.find(src) != rMsgMap.map.end()){ - if(rMsgMap.map[src].find(tag) != rMsgMap.map[src].end()) - if(rMsgMap.map[src][tag].size() >0){ - posted_recv=true; - localbuf= (rMsgMap.map[src][tag].front()->databuf).local(); //(double*) static_cast > (rMsgMap.map[src][tag].front()->databuf).local(); - *(rMsgMap.map[src][tag].front()->request)= upcxx::rget(sbuf, localbuf, size); - rMsgMap.map[src][tag].pop_front(); - rMsgMap.size--; - } - } - pthread_mutex_unlock(&(rMsgMap.lock)); - //save pull request for later when recv buffer is posted - if(posted_recv==false){ - getReq_t *req= new getReq_t(src, tag, sbuf, size); - pendingGetList.add(req); - } - } - ); - } - } - } // for(irMap[f]->r_con.nrcv; i++) - { - if(rg->rMap[f]->r_con.rcv[i].pQueue.queueSize(true) > 0) //!all messages before rear have completed - { - //if(pthread_mutex_trylock(&(rg->lMap[f]->r_con.rcvLock)) != 0) // 0-Fail, otherwise-Succeed - { - Package *rearPackage = rg->lMap[f]->r_con.rcv[i].pQueue.getRear(true); - if(!rearPackage->completed) - { - bool flag = false; - int ret_flag; - if(rearPackage->request->ready()) - { - 
pthread_mutex_lock(&(rg->lMap[f]->r_con.rcvLock)); - int ns = rg->lMap[f]->r_con.rcv[i].ns; - int nd = rg->lMap[f]->r_con.rcv[i].nd; - int lnd = rg->lMap[f]->r_con.rcv[i].lnd; - int r_grids = rg->lMap[f]->r_con.rcv[i].r_grids; - int tag = rearPackage->tag; - //int tag = tagMap[ rg->lMap[f]->r_con.rcv[i].pr][graphID][nd][ns][ rg->lMap[f]->r_con.rcv[i].sz]; - int dst = upcxx::rank_me(); - int src= rg->lMap[f]->r_con.rcv[i].pr; - upcxx::rpc(src, - [=](){ - pthread_mutex_lock(&(sMsgMap.lock)); - sMsgMap.map[dst][tag].front()->completed=true; - sMsgMap.map[dst][tag].pop_front(); - sMsgMap.size--; - pthread_mutex_unlock(&(sMsgMap.lock)); - } - ); - - delete rearPackage->request; - rearPackage->completeRequest(); - rg->lMap[f]->r_con.rcv[i].pQueue.getRear()->completeRequest(); - if(rg->rMap[f]->r_con.rcv[i].pQueue.queueSize(true) == 1) - rg->lMap[f]->r_con.firingRuleCnt++; - pthread_mutex_unlock(&(rg->lMap[f]->r_con.rcvLock)); - } - } - //pthread_mutex_unlock(&(rg->lMap[f]->r_con.rcvLock)); - } // if(omp_test_lock) - } // if(queueSize > 0) - } // for(ilMap[f]->r_con.nsnd; i++) - { - if(rg->sMap[f]->r_con.snd[i].pQueue.queueSize(true) > 0) - { - Package *frontPackage = rg->sMap[f]->r_con.snd[i].pQueue.getFront(true); - if(frontPackage->served) //!latest receive request has NOT been completed - { - bool flag = false; - int ret_flag; - if(frontPackage->request==0) - { - pthread_mutex_lock(&(rg->sMap[f]->r_con.sndLock)); - frontPackage = rg->sMap[f]->r_con.snd[i].pQueue.dequeue(true); - frontPackage->completed = false; - frontPackage->served = false; - frontPackage->request = 0; - frontPackage->tag = 0; - rg->sMap[f]->r_con.snd[i].recycleQueue.enqueue(frontPackage,true); - pthread_mutex_unlock(&(rg->sMap[f]->r_con.sndLock)); - - pthread_mutex_lock(&(rg->lMap[f]->r_con.sndLock)); - frontPackage = rg->lMap[f]->r_con.snd[i].pQueue.dequeue(true); - frontPackage->completed = false; - frontPackage->served = false; - frontPackage->request = 0; - frontPackage->tag = 0; - rg->lMap[f]->r_con.snd[i].recycleQueue.enqueue(frontPackage,true); - pthread_mutex_unlock(&(rg->lMap[f]->r_con.sndLock)); - } - } - } // if(queueSize > 0) - } // for(itotalFinishes < perilla::NUM_THREAD_TEAMS) - { - serviceLocalRequests(graph, tg); - if((np>1) & (tg==0)) - serviceRemoteRequests(graph); - } - else - { - if(tg==0) - { - while(graph->totalFinishes < perilla::NUM_THREAD_TEAMS) - { - } - //call parallel_barrier() ---???????? - ParallelDescriptor::Barrier("serviceSingleGraph-1"); - graph->graphTeardown(); - graph->workerTeardown(); - //call parallel_barrier() ------????????? 
- ParallelDescriptor::Barrier("serviceSingleGraph-2"); - } - break; - } - } // while(true) -} //serviceSingleGraphComm - -void Perilla::serviceMultipleGraphComm(RegionGraph graphArray[], int nGraphs, bool cpyAcross, int tid) -{ - int tg = WorkerThread::perilla_wid(); - int np = ParallelDescriptor::NProcs(); - int graphFinishCnt = 0; - while(true) - { - for(int g=0; g 1) - if(tg==0) - { - serviceRemoteRequests(&graphArray[g],g,nGraphs); - //if(cpyAcross) - //serviceRemoteGridCopyRequests(graphArray,g,nGraphs,tg); - } - } - } - //!check if we have finished all the graph execution - bool noMoreWork = true; - for(int g=0; g graphArray, bool cpyAcross, int tid) -{ - int tg = WorkerThread::perilla_wid(); - int np = ParallelDescriptor::NProcs(); - int nGraphs = graphArray.size(); - - for(int g=0; g 1)//if(tg==0) - { - if(tg==0){ - serviceRemoteRequests(graphArray[g],g,nGraphs); - if(cpyAcross) - serviceRemoteGridCopyRequests(graphArray,g,nGraphs,tg); - } - } - } -} //serviceMultipleGraphCommDynamic -#endif - -#if 0 -void Perilla::serviceMultipleGraphComm(RegionGraph graphArray[], int nGraphs, int tid) -{ - serviceMultipleGraphComm(graphArray,nGraphs,false,tid); -} // serviceMultipleGraphComm -#endif - -void Perilla::fillBoundaryPush(RegionGraph* graph, MultiFab* mf, int f) -{ - - int nComp = mf->nComp(); - int tg= WorkerThread::perilla_wid(); - int ntid = WorkerThread::perilla_wtid(); - - //if(graph->graphID == 1 && f == 1) - //std::cout << "fillBPush for gID 1 f 1 ntid "<< ntid <lMap[f]->l_con.sLock)); - graph->worker[tg]->barr->sync(perilla::NUM_THREADS_PER_TEAM-1); // Barrier to synchronize team threads - - if(perilla::PACKING_FINEGRAIN) - {} - else - { - for(int i=0; ilMap[f]->l_con.nscpy; i++) - if( (i%(perilla::NUM_THREADS_PER_TEAM-1)) == ntid) - { - - //if(graph->graphID == 1 && graph->lMap[f]->l_con.scpy[i].nd == 1) - //std::cout << "fillBPush for gID 1 nd 1 pQenQ f " << f << " i " << i <lMap[f]->l_con.scpy[i].recycleQueue.getFront(true); - mf->m_fabs_v[f]->copyToMem(graph->lMap[f]->l_con.scpy[i].sbx,0,nComp,sPackage->databuf.local()); - - //for(int d=0; dbufSize; d++) - //if(sPackage->databuf[d] == 0) - //{ - //std::cout<< "in fbPush Sending 0 from f "<< f <databuf[d] != 0); - //} - //if(graph->lMap[f]->l_con.scpy[i].sbx.smallEnd() == graph->lMap[f]->l_con.scpy[i].sbx.bigEnd()) - //if(graph->lMap[f]->l_con.scpy[i].sbx.smallEnd(0)==7 && graph->lMap[f]->l_con.scpy[i].sbx.smallEnd(1)==7 && graph->lMap[f]->l_con.scpy[i].sbx.smallEnd(2)==4) - // std::cout<< "Corner Push for f "<< f << " data0 " <databuf[0]<< " size " <bufSize << " se "<< graph->lMap[f]->l_con.scpy[i].sbx.smallEnd() <worker[tg]->barr->sync(perilla::NUM_THREADS_PER_TEAM-1); // Barrier to synchronize team threads - - if(ntid==0) - { - //if(graph->graphID == 1 && f == 1) - //std::cout << "fillBPush for gID 1 f 1 pQ enQ" <lMap[f]->l_con.nscpy; i++) - { - //if(graph->graphID == 1 && graph->lMap[f]->l_con.scpy[i].nd == 1) - //std::cout << "fillBPush for gID 1 nd 1 pQ enQ from f "<< f <lMap[f]->l_con.scpy[i].pQueue.enqueue( graph->lMap[f]->l_con.scpy[i].recycleQueue.dequeue(true),true ); - } - pthread_mutex_unlock(&(graph->lMap[f]->l_con.sLock)); - } - graph->worker[tg]->barr->sync(perilla::NUM_THREADS_PER_TEAM-1); // Barrier to synchronize team threads - } // if(LAZY_PUSH) - else - - int np = ParallelDescriptor::NProcs(); - if (np==1) return; - - if(ntid==0) - pthread_mutex_lock(&(graph->lMap[f]->r_con.sndLock)); - graph->worker[tg]->barr->sync(perilla::NUM_THREADS_PER_TEAM-1); // Barrier to synchronize team threads - - for(int i=0; 
ilMap[f]->r_con.nsnd; i++) - if((i%(perilla::NUM_THREADS_PER_TEAM-1))==ntid) - { - //std::cout << "RQS " << graph->lMap[f]->r_con.snd[i].recycleQueue.queueSize() << std::endl; - - Package *sndPackage = graph->lMap[f]->r_con.snd[i].recycleQueue.dequeue(true); - mf->m_fabs_v[f]->copyToMem(graph->lMap[f]->r_con.snd[i].sbx,0,nComp,sndPackage->databuf.local()); - graph->lMap[f]->r_con.snd[i].pQueue.enqueue( sndPackage,true ); - //!the local message handler will detect the change and notify the remote message handler =>read access - //!the remote message handler first modifies the front item of this queue, then it push this item back to the message pool - } - graph->worker[tg]->barr->sync(perilla::NUM_THREADS_PER_TEAM-1); // Barrier to synchronize team threads - if(ntid==0) - { - pthread_mutex_unlock(&(graph->lMap[f]->r_con.sndLock)); - pthread_mutex_lock(&(graph->sMap[f]->r_con.sndLock)); - for(int i=0; ilMap[f]->r_con.nsnd; i++) - graph->sMap[f]->r_con.snd[i].pQueue.enqueue( graph->sMap[f]->r_con.snd[i].recycleQueue.dequeue(true),true ); - pthread_mutex_unlock(&(graph->sMap[f]->r_con.sndLock)); - } - -} // fillBoundaryPush - -void Perilla::fillBoundaryPull(RegionGraph* graph, MultiFab* mf, int f, bool singleT) -{ - - int nComp = mf->nComp(); - int tg= WorkerThread::perilla_wid(); - int ntid = WorkerThread::perilla_wtid(); - - if(ntid==0) - pthread_mutex_lock(&(graph->lMap[f]->l_con.dLock)); - if(!singleT) - graph->worker[tg]->barr->sync(perilla::NUM_THREADS_PER_TEAM-1); // Barrier to synchronize team threads - - if(perilla::LAZY_PUSH) - { } - else - { - if(perilla::UNPACKING_FINEGRAIN) - {} - else - { - for(int i=0; ilMap[f]->l_con.ndcpy; i++) - if( (i%(perilla::NUM_THREADS_PER_TEAM-1)) == ntid) - { - Package *dPackage = graph->lMap[f]->l_con.dcpy[i].pQueue.getFront(true); - mf->m_fabs_v[f]->copyFromMem(graph->lMap[f]->l_con.dcpy[i].dbx,0,nComp,dPackage->databuf.local()); - } - } // if(UNPACKING_FINEGRAIN) - else - } // if(LAZY_PUSH) - else - - if(!singleT) - graph->worker[tg]->barr->sync(perilla::NUM_THREADS_PER_TEAM-1); // Barrier to synchronize team threads - - if(ntid==0) - { - for(int i=0; ilMap[f]->l_con.ndcpy; i++) - graph->lMap[f]->l_con.dcpy[i].recycleQueue.enqueue( graph->lMap[f]->l_con.dcpy[i].pQueue.dequeue(true),true ); - - graph->lMap[f]->l_con.firingRuleCnt = graph->lMap[f]->l_con.firingRuleCnt - graph->lMap[f]->l_con.ndcpy; - - graph->lMap[f]->l_con.scpyCnt = 0; - for(int i=0; ilMap[f]->l_con.ndcpy; i++) - if(graph->lMap[f]->l_con.dcpy[i].pQueue.queueSize(true) >= 1) - graph->lMap[f]->l_con.firingRuleCnt++; - pthread_mutex_unlock(&(graph->lMap[f]->l_con.dLock)); - } - if(!singleT) - graph->worker[tg]->barr->sync(perilla::NUM_THREADS_PER_TEAM-1); // Barrier to synchronize team threads - - int np = ParallelDescriptor::NProcs(); - if (np==1) return; - - if(ntid==0) - { - pthread_mutex_lock(&(graph->rMap[f]->r_con.rcvLock)); - pthread_mutex_lock(&(graph->lMap[f]->r_con.rcvLock)); - } - if(!singleT) - graph->worker[tg]->barr->sync(perilla::NUM_THREADS_PER_TEAM-1); // Barrier to synchronize team threads - - for(int i=0; ilMap[f]->r_con.nrcv; i++) - if( (i%(perilla::NUM_THREADS_PER_TEAM-1)) == ntid) - { - Package *rcvMetaPackage = graph->rMap[f]->r_con.rcv[i].pQueue.dequeue(true); - rcvMetaPackage->completed = false; - rcvMetaPackage->served = false; - rcvMetaPackage->request = 0; - graph->rMap[f]->r_con.rcv[i].recycleQueue.enqueue(rcvMetaPackage,true); - Package *rcvPackage = graph->lMap[f]->r_con.rcv[i].pQueue.dequeue(true); - 
-            mf->m_fabs_v[f]->copyFromMem(graph->lMap[f]->r_con.rcv[i].dbx,0,nComp,rcvPackage->databuf.local());
-            rcvPackage->completed = false;
-            graph->lMap[f]->r_con.rcv[i].recycleQueue.enqueue(rcvPackage,true);
-        }
-    if(!singleT)
-        graph->worker[tg]->barr->sync(perilla::NUM_THREADS_PER_TEAM-1); // Barrier to synchronize team threads
-
-    if(ntid==0)
-    {
-        graph->lMap[f]->r_con.firingRuleCnt = graph->lMap[f]->r_con.firingRuleCnt - graph->lMap[f]->r_con.nrcv;
-        for(int i=0; i<graph->lMap[f]->r_con.nrcv; i++)
-            if(graph->lMap[f]->r_con.rcv[i].pQueue.queueSize(true) >= 1)
-                if(graph->lMap[f]->r_con.rcv[i].pQueue.getFront(true)->checkRequest())
-                    graph->lMap[f]->r_con.firingRuleCnt++;
-        pthread_mutex_unlock(&(graph->lMap[f]->r_con.rcvLock));
-        pthread_mutex_unlock(&(graph->rMap[f]->r_con.rcvLock));
-    }
-
-} // fillBoundaryPull
-
-void Perilla::fillBoundaryPull(amrex::RGIter& rgi, RegionGraph* rg, amrex::MultiFab& mf, bool singleT)
-{
-    if(rgi.currentItr != 1)
-        return;
-
-    int f = rgi.currentRegion;
-    fillBoundaryPull(rg, &mf, f, singleT);
-}
-
-void Perilla::fillBoundaryPull(amrex::RGIter& rgi, amrex::MultiFab& mf, bool singleT)
-{
-    if(rgi.currentItr != 1)
-        return;
-
-    int f = rgi.currentRegion;
-    fillBoundaryPull(rgi.itrGraph, &mf, f, singleT);
-}
-
-
-/////////////////////////////////////////////////////////////////////////////////////////////////////////////////
-
-Array<const FabArrayBase::CopyComTagsContainer*> send_cctc;
-Array<int> send_pr;
-Array<const FabArrayBase::CopyComTagsContainer*> recv_cctc;
-Array<int> recv_pr;
-
-
-void Perilla::multifabExtractCopyAssoc(RegionGraph* gDst, RegionGraph* gSrc, const MultiFab& mfDst, const MultiFab& mfSrc, int nc, int ng, int ngSrc, const Periodicity& period)
-{
-#if 1
-    int myProc = ParallelDescriptor::MyProc();
-    int np = ParallelDescriptor::NProcs();
-    try{
-        if(true)//if(!(*mfSrc == *mfDst))
-        {
-#ifdef USE_PERILLA_PTHREADS
-            //    if(perilla::isMasterThread())
-#endif
-            {
-                if(ng > mfDst.nGrow()) cout <<"MULTIFAB_COPY_C: ng > mfDst.nGrow not supported in parallel copy"<< endl;
-                if(ngSrc > mfSrc.nGrow()) cout <<"MULTIFAB_COPY_C: ngSrc > mfSrc.nGrow"<< endl;
-                if(ngSrc > 0)
-                {
-                    // To be implemented
-                    //do i = 1, nboxes(msrc%la)
-                    //  call push_back(bl, grow(box_nodalize(get_box(msrc%la,i),msrc%nodal),lngsrc))
-                    //end do
-                    //call build(batmp, bl, sort = .false.)
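// [Sketch, not Perilla source] The Fortran-era pseudocode in this comment
// block grows each source box by ngSrc and builds a zero-ghost temporary
// MultiFab on the same distribution to stand in for mfSrc. Assuming plain
// cell-centered boxes, a C++ AMReX equivalent would be roughly:
//
//     amrex::BoxArray batmp = mfSrc.boxArray();
//     batmp.grow(ngSrc);
//     amrex::MultiFab msrctmp(batmp, mfSrc.DistributionMap(), nc, 0);
//
// The path is currently unreachable (note the assert(false) below).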
- //call destroy(bl) - //call build(lasrctmp, batmp, boxarray_bbox(batmp), explicit_mapping = get_proc(msrc%la)) - //call destroy(batmp) - //call build(msrctmp, lasrctmp, nc = lnc, ng = 0) - //pmfsrc => msrctmp - assert(false); - } - if(np > 1) - { - if(gSrc->sCopyMapHead == 0) - gSrc->sCopyMapHead = new CopyMap(); - else - { - CopyMap *tmpCopyMap = new CopyMap(); - tmpCopyMap->next = gSrc->sCopyMapHead; - gSrc->sCopyMapHead = tmpCopyMap; - } - if(gDst->rCopyMapHead == 0) - gDst->rCopyMapHead = new CopyMap(); - else - { - CopyMap *tmpCopyMap = new CopyMap(); - tmpCopyMap->next = gDst->rCopyMapHead; - gDst->rCopyMapHead = tmpCopyMap; - } - //gSrc->sCopyMapHead->map.reserve(mfSrc.size()); - //gDst->rCopyMapHead->map.reserve(mfDst.size()); - gSrc->sCopyMapHead->alloc_CopyMap(mfSrc); - gDst->rCopyMapHead->alloc_CopyMap(mfDst); - } - - //if(gSrc->numTasks != mfSrc.IndexArray().size()) - // std::cout<< "before " <numTasks << " now " <graphID << std::endl; - - gSrc->numFabs = mfSrc.size(); - gDst->numFabs = mfDst.size(); - gSrc->numTasks = mfSrc.IndexArray().size(); - gDst->numTasks = mfDst.IndexArray().size(); - } -#ifdef USE_PERILLA_PTHREADS - // perilla::syncAllThreads(); -#endif - const FabArrayBase::CPC *TheCPC= &mfDst.getCPC(ng, mfSrc, ngSrc, period);; - - int nfabsSrc = mfSrc.IndexArray().size(); - int nfabsDst = mfDst.IndexArray().size(); - - const int nloc_cpAsc = TheCPC->m_LocTags->size(); - const int nsnds_cpAsc = TheCPC->m_SndTags->size(); - const int nrcvs_cpAsc = TheCPC->m_RcvTags->size(); -#ifdef USE_PERILLA_PTHREADS - // perilla::syncAllThreads(); -#endif - - if(np > 1){ -#ifdef USE_PERILLA_PTHREADS - // if(perilla::isMasterThread()) -#endif - { - send_cctc.reserve(nsnds_cpAsc); - - for (FabArrayBase::MapOfCopyComTagContainers::const_iterator m_it = TheCPC->m_SndTags->begin(), - m_End = TheCPC->m_SndTags->end(); - m_it != m_End; - ++m_it) - { - if(m_it->first != myProc) // Not destined to me. 
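// [Sketch, not Perilla source] This send-side loop, and the matching
// receive-side loop below, reduce to collecting the non-local partner
// ranks and pointers to their CopyComTag containers out of the CPC's
// per-rank maps:
//
//     template <typename Container>
//     void collectPartners(const std::map<int, Container>& tagsByRank,
//                          int myRank, std::vector<int>& ranks,
//                          std::vector<const Container*>& containers)
//     {
//         for (const auto& kv : tagsByRank)
//             if (kv.first != myRank) {        // skip self
//                 ranks.push_back(kv.first);
//                 containers.push_back(&kv.second);
//             }
//     }
//
// send_pr/send_cctc and recv_pr/recv_cctc are exactly these two vectors.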
- { - send_pr.push_back(m_it->first); - send_cctc.push_back(&(m_it->second)); - } - } - - recv_cctc.reserve(nrcvs_cpAsc); - - for (FabArrayBase::MapOfCopyComTagContainers::const_iterator m_it = TheCPC->m_RcvTags->begin(), - m_End = TheCPC->m_RcvTags->end(); - m_it != m_End; - ++m_it) - { - if(m_it->first != myProc) // I am not the source for this receipt - { - recv_pr.push_back(m_it->first); - recv_cctc.push_back(&(m_it->second)); - } - } - } - } -#ifdef USE_PERILLA_PTHREADS - // perilla::syncAllThreads(); -#endif - - //#ifndef USE_PERILLA_PTHREADS -#pragma omp parallel shared(gSrc, gDst, mfSrc, mfDst, nfabsSrc, nfabsDst) - //#endif - { - int tid = omp_get_thread_num();//perilla::tid();//omp_get_thread_num(); - int tg = tid/perilla::NUM_THREADS_PER_TEAM;//perilla::wid();//WorkerThread::perilla_wid(); - int nt= tid%perilla::NUM_THREADS_PER_TEAM; - int fg; - //std::cout<<"thread "<< tid<<"group "<graphID << " numTask " << gDst->numTasks << " numFabs " << gDst->numFabs <graphID > 25) - //std::cout<< "Inside parallel Generating Send at tid " << tid << " f " << f << " gID " << gDst->graphID <task[f]->cpAsc_srcHead == 0) - { - gSrc->task[f]->cpAsc_srcHead = new FabCopyAssoc(); - cpSrc = gSrc->task[f]->cpAsc_srcHead; - } - else - { - cpSrc = new FabCopyAssoc(); - cpSrc->next = gSrc->task[f]->cpAsc_srcHead; - gSrc->task[f]->cpAsc_srcHead = cpSrc; - } - - cpSrc->graphPartner = gDst; - cpSrc->l_con.nscpy = 0; - for(int i=0; im_LocTags)[i]; - //if(f == tag.srcIndex) - if(mfSrc.IndexArray()[f] == tag.srcIndex) - cpSrc->l_con.nscpy++; - } - cpSrc->l_con.scpy = new LocalCopyDescriptor[cpSrc->l_con.nscpy]; - - //if(gDst->graphID == 4 && tag.dstIndex == 60 ) - //std::cout<< "Inside parallel Generating Local Copy send at tid " << tid << " f " << f << " gID " << gDst->graphID <<" num local connections"<< nloc_cpAsc << std::endl; - - for(int i=0; im_LocTags)[i]; - //if(f == tag.srcIndex) - if(mfSrc.IndexArray()[f] == tag->srcIndex) - { - cpSrc->l_con.scpy[scnt].ns = mfSrc.localindex(tag->srcIndex); - cpSrc->l_con.scpy[scnt].nd = mfDst.localindex(tag->dstIndex); - cpSrc->l_con.scpy[scnt].sbx = tag->sbox; - cpSrc->l_con.scpy[scnt].dbx = tag->dbox; - int psize = tag->sbox.numPts() * mfSrc.nComp(); //---------------------------------------------------------------???????????????? - //std::cout<< " gSrc ID "<< gSrc->graphID << " f "<databuf[j] = 0; - cpSrc->l_con.scpy[scnt].pQueue.enqueue(tmpPkg); - } - for(int p=0; pl_con.scpy[scnt].recycleQueue.enqueue(cpSrc->l_con.scpy[scnt].pQueue.dequeue()); - scnt++; - } - } - - if(np > 1) - { - cpSrc->r_con.nsnd = 0; - cpSrc->r_con.remotePushReady = false; - cpSrc->r_con.firingRuleCnt = 0; - for(int i=0; isrcIndex) - cpSrc->r_con.nsnd++; - } - } // for(ir_con.snd = new RemoteCommDescriptor[cpSrc->r_con.nsnd]; - scnt = 0; - for(int i=0; isrcIndex) - { - cpSrc->r_con.snd[scnt].ns = it->srcIndex; - cpSrc->r_con.snd[scnt].nd = it->dstIndex; - cpSrc->r_con.snd[scnt].lns = mfSrc.localindex(it->srcIndex); - cpSrc->r_con.snd[scnt].lnd = mfDst.localindex(it->dstIndex); - cpSrc->r_con.snd[scnt].sbx = it->sbox; - cpSrc->r_con.snd[scnt].dbx = it->dbox; - int psize = it->sbox.numPts() * mfSrc.nComp(); //---------------------------------------------------------------???????????????? 
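// ----------------------------------------------------------------------
// [Sketch, not Perilla source] Message sizing and buffer pre-generation
// as used by the descriptor setup above: each payload is
// psize = box.numPts() * nComp doubles, and a fixed number of zero-filled
// Packages is minted up front and parked on the recycle (free) queue.
// Pool size and names below are illustrative; cleanup is elided.
#include <vector>

struct PoolPkg {
    std::vector<double> databuf;
    explicit PoolPkg(long n) : databuf(static_cast<size_t>(n), 0.0) {}
};

std::vector<PoolPkg*> pregeneratePackages(long boxNumPts, int nComp, int poolSize)
{
    const long psize = boxNumPts * nComp;        // doubles per message
    std::vector<PoolPkg*> freeList;
    freeList.reserve(poolSize);
    for (int p = 0; p < poolSize; ++p)
        freeList.push_back(new PoolPkg(psize));  // buffer arrives zeroed
    return freeList;                             // becomes the recycleQueue
}
// ----------------------------------------------------------------------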
- - for(int p=0; pdatabuf[j] = 0; - cpSrc->r_con.snd[scnt].pQueue.enqueue(tmpPkg); - } - for(int p=0; pr_con.snd[scnt].recycleQueue.enqueue(cpSrc->r_con.snd[scnt].pQueue.dequeue()); - scnt++; - } - } - } // for(i 1) - } // if(fg==tg) - - //perilla::syncAllThreads(); -#pragma omp barrier - if(np > 1) - { - //if(WorkerThread::perilla_isMasterWorkerThread() && tg==0) - if(tid==0) - { - - // std::cout<< "Inside parallel Generating Remote Send tg 0 at tid " << tid << " f " << f << " gID " << gDst->graphID <sCopyMapHead->map[f]->r_con.nsnd = 0; - gSrc->sCopyMapHead->map[f]->r_con.firingRuleCnt = 0; - for(int i=0; isrcIndex) - gSrc->sCopyMapHead->map[f]->r_con.nsnd++; - } - } // for(isCopyMapHead->map[f]->r_con.snd = new RemoteCommDescriptor[gSrc->sCopyMapHead->map[f]->r_con.nsnd]; - int scnt = 0; - for(int i=0; isrcIndex) - { - - //if(gDst->graphID == 31 && (it->dstIndex == 519)) - //std::cout <<"myP " <dstIndex << " ns "<< it->srcIndex << " f " << f << " i "<< scnt << " tg " <sCopyMapHead->map[f]->r_con.snd[scnt].ns = it->srcIndex; - gSrc->sCopyMapHead->map[f]->r_con.snd[scnt].nd = it->dstIndex; - gSrc->sCopyMapHead->map[f]->r_con.snd[scnt].r_gid = gDst->graphID-1; - gSrc->sCopyMapHead->map[f]->r_con.snd[scnt].r_grids = (gDst->numFabs > gSrc->numFabs ? gDst->numFabs : gSrc->numFabs); - gSrc->sCopyMapHead->map[f]->r_con.snd[scnt].lns = mfSrc.localindex(it->srcIndex); - gSrc->sCopyMapHead->map[f]->r_con.snd[scnt].lnd = mfDst.localindex(it->dstIndex); - gSrc->sCopyMapHead->map[f]->r_con.snd[scnt].sbx = it->sbox; - gSrc->sCopyMapHead->map[f]->r_con.snd[scnt].dbx = it->dbox; - - int psize = it->sbox.numPts() * mfSrc.nComp(); //---------------------------------------------------------------???????????????? - - gSrc->sCopyMapHead->map[f]->r_con.snd[scnt].sz = psize; - gSrc->sCopyMapHead->map[f]->r_con.snd[scnt].pr = send_pr[i]; - - for(int p=0; pdatabuf[j] = 0; - gSrc->sCopyMapHead->map[f]->r_con.snd[scnt].pQueue.enqueue(tmpPkg); - } - for(int p=0; psCopyMapHead->map[f]->r_con.snd[scnt].recycleQueue.enqueue(gSrc->sCopyMapHead->map[f]->r_con.snd[scnt].pQueue.dequeue()); - scnt++; - } - } - } // for(i 1) - } // for(fgraphID > 25) - //std::cout<< "Inside parallel Generating Recive at tid " << tid << " f " << f << " gID " << gDst->graphID <task[f]->cpAsc_dstHead == 0) - { - gDst->task[f]->cpAsc_dstHead = new FabCopyAssoc(); - cpDst = gDst->task[f]->cpAsc_dstHead; - } - else - { - cpDst = new FabCopyAssoc(); - cpDst->next = gDst->task[f]->cpAsc_dstHead; - gDst->task[f]->cpAsc_dstHead = cpDst; - } - cpDst->graphPartner = gSrc; - cpDst->l_con.ndcpy = 0; - cpDst->l_con.firingRuleCnt = 0; - cpDst->l_con.dcpyCnt = 0; - for(int i=0; im_LocTags)[i]; - //if(f == tag.dstIndex) - if(mfDst.IndexArray()[f] == tag->dstIndex) - cpDst->l_con.ndcpy++; - } - cpDst->l_con.dcpy = new LocalCopyDescriptor[cpDst->l_con.ndcpy]; - int dcnt = 0; - - //if(gDst->graphID > 25) - //std::cout<< "Inside parallel Generating Local copy recive at tid " << tid << " f " << f << " gID " << gDst->graphID <graphID ==27 && f == 633) - //std::cout<< "tid " << tid << " f " << f << " gID " << gDst->graphID << " numReciv " << nloc_cpAsc << " ndcpy " << cpDst->l_con.ndcpy <m_LocTags)[i]; - //if(f == tag->dstIndex) - if(mfDst.IndexArray()[f] == tag->dstIndex) - { - - //if(gDst->graphID == 4 && (tag->dstIndex == 60 || tag->dstIndex == 59)) - //std::cout<< "dcpy tid " << tid << " f " << f << " i " << i << " dcnt " << dcnt << " ns "<srcIndex << " nd "<dstIndex << " lo " << tag->dbox.smallEnd() << " hi " << tag->dbox.bigEnd() <l_con.dcpy[dcnt].ns = 
mfSrc.localindex(tag->srcIndex); - cpDst->l_con.dcpy[dcnt].nd = mfDst.localindex(tag->dstIndex); - cpDst->l_con.dcpy[dcnt].sbx = tag->sbox; - cpDst->l_con.dcpy[dcnt].dbx = tag->dbox; - - // if(gDst->graphID > 25 && f == 633) - //std::cout<< " Generating Package tid " << tid << " i " << i <dbox.numPts() * mfSrc.nComp(); //---------------------------------------------------------------???????????????? - cpDst->l_con.dcpy[dcnt].sz = psize; - - if(!gDst->isDepGraph) - { - for(int p=0; pdatabuf[j] = 0; - cpDst->l_con.dcpy[dcnt].pQueue.enqueue(tmpPkg); - } - - // if(gDst->graphID > 25 && f == 633) - //std::cout<< " Generating now in reQ Package tid " << tid << " i " << i <l_con.dcpy[dcnt].recycleQueue.enqueue(cpDst->l_con.dcpy[dcnt].pQueue.dequeue()); - - //if(gDst->graphID > 25 && f == 633) - // std::cout<< " Generated Package tid " << tid << " i " << i <graphID > 25 && f > 630) - //std::cout<< "Safe now tid " << tid << " f " << f << " gID " << gDst->graphID << " numReciv " << nloc_cpAsc <srcLinkGraph; - for(int df=0; df < gDst->task[f]->depTaskIDs.size(); df++) - { - int dfi = gDst->task[f]->depTaskIDs[df]; - FabCopyAssoc *cpdDst = depGraph->task[dfi]->cpAsc_dstHead; - for(int i=0; il_con.ndcpy ; i++) - { - for(int p=0; pl_con.dcpy[i].sz; - Package *tmpPkg = new Package(psize); - for(int j=0; jdatabuf[j] = 0; - cpdDst->l_con.dcpy[i].pQueue.enqueue(tmpPkg); - } - for(int p=0; pl_con.dcpy[i].recycleQueue.enqueue(cpdDst->l_con.dcpy[i].pQueue.dequeue()); - } - } - - if(np > 1) - { - cpDst->r_con.nrcv = 0; - cpDst->r_con.remotePullDone = false; - cpDst->r_con.firingRuleCnt = 0; - for(int i=0; idstIndex) - cpDst->r_con.nrcv++; - } - } // for(ir_con.rcv = new RemoteCommDescriptor[cpDst->r_con.nrcv]; - dcnt = 0; - for(int i=0; idstIndex) - if(mfDst.IndexArray()[f] == it->dstIndex) - { - cpDst->r_con.rcv[dcnt].nd = it->dstIndex; - cpDst->r_con.rcv[dcnt].ns = it->srcIndex; - cpDst->r_con.rcv[dcnt].lnd = mfDst.localindex(it->dstIndex); - cpDst->r_con.rcv[dcnt].lns = mfSrc.localindex(it->srcIndex); - cpDst->r_con.rcv[dcnt].sbx = it->sbox; - cpDst->r_con.rcv[dcnt].dbx = it->dbox; - int psize = it->dbox.numPts() * mfDst.nComp(); //---------------------------------------------------------------???????????????? 
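// ----------------------------------------------------------------------
// [Sketch, not Perilla source] The firingRuleCnt bookkeeping that recurs
// above: a region-graph task becomes runnable ("fires") only when every
// one of its connections has a pending package, and remote receives also
// require the transfer request to have completed. One way to read it:
#include <vector>

struct ConnState {
    int  queued      = 0;     // pQueue.queueSize()
    bool remote      = false;
    bool requestDone = false; // pQueue.getFront()->checkRequest()
};

bool readyToFire(const std::vector<ConnState>& conns)
{
    int firingRuleCnt = 0;
    for (const ConnState& c : conns)
        if (c.queued >= 1 && (!c.remote || c.requestDone))
            ++firingRuleCnt;
    return firingRuleCnt == static_cast<int>(conns.size());
}
// The real code maintains the counter incrementally under the connection
// locks rather than recomputing it, but this is the condition it tracks.
// ----------------------------------------------------------------------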
- cpDst->r_con.rcv[dcnt].sz = psize; - - if(!gDst->isDepGraph) - { - for(int p=0; pdatabuf[j] = 0; - cpDst->r_con.rcv[dcnt].pQueue.enqueue(tmpPkg); - } - for(int p=0; pr_con.rcv[dcnt].recycleQueue.enqueue(cpDst->r_con.rcv[dcnt].pQueue.dequeue()); - } - - dcnt++; - } - } - }// for(isrcLinkGraph; - for(int df=0; df < gDst->task[f]->depTaskIDs.size(); df++) - { - int dfi = gDst->task[f]->depTaskIDs[df]; - FabCopyAssoc *cpdDst = depGraph->task[dfi]->cpAsc_dstHead; - for(int i=0; ir_con.nrcv ; i++) - { - for(int p=0; pr_con.rcv[i].sz; - Package *tmpPkg = new Package(psize); - for(int j=0; jdatabuf[j] = 0; - cpdDst->r_con.rcv[i].pQueue.enqueue(tmpPkg); - } - for(int p=0; pr_con.rcv[i].recycleQueue.enqueue(cpdDst->r_con.rcv[i].pQueue.dequeue()); - } - } - - - } // if(np > 1) - }// if(fg==tg) - - //perilla::syncAllThreads(); -#pragma omp barrier - - if(np > 1) - { - //if(WorkerThread::perilla_isMasterWorkerThread() && tg==0) - if(tid==0) - { - // std::cout<< "Inside parallel Generating Remote Recive tg 0 at tid " << tid << " f " << f << " gID " << gDst->graphID <rCopyMapHead->map[f]->r_con.nrcv = 0; - gDst->rCopyMapHead->map[f]->r_con.firingRuleCnt = 0; - for(int i=0; idstIndex) - if(mfDst.IndexArray()[f] == it->dstIndex) - gDst->rCopyMapHead->map[f]->r_con.nrcv++; - } - } - gDst->rCopyMapHead->map[f]->r_con.rcv = new RemoteCommDescriptor[gDst->rCopyMapHead->map[f]->r_con.nrcv]; - int dcnt = 0; - for(int i=0; idstIndex) - if(mfDst.IndexArray()[f] == it->dstIndex) - { - - // if(myProc==54 && gDst->graphID == 25 && f == 10) - // std::cout <<"myP " <dstIndex << " ns "<< it->srcIndex << " f " << f << " sgID "<< gSrc->graphID <<" tg "<rCopyMapHead->map[f]->r_con.rcv[dcnt].nd = it->dstIndex; - gDst->rCopyMapHead->map[f]->r_con.rcv[dcnt].ns = it->srcIndex; - gDst->rCopyMapHead->map[f]->r_con.rcv[dcnt].lnd = mfDst.localindex(it->dstIndex); - gDst->rCopyMapHead->map[f]->r_con.rcv[dcnt].lns = mfSrc.localindex(it->srcIndex); - gDst->rCopyMapHead->map[f]->r_con.rcv[dcnt].r_grids = (gDst->numFabs > gSrc->numFabs ? gDst->numFabs : gSrc->numFabs); - gDst->rCopyMapHead->map[f]->r_con.rcv[dcnt].sbx = it->sbox; - gDst->rCopyMapHead->map[f]->r_con.rcv[dcnt].dbx = it->dbox; - - int psize = it->dbox.numPts() * mfDst.nComp(); //---------------------------------------------------------------???????????????? 
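// ----------------------------------------------------------------------
// [Sketch, not Perilla source] Each remote transfer is mirrored twice:
// the FabCopyAssoc queues (cpSrc/cpDst) drained by worker threads carry
// the payload, while the graph's sCopyMapHead/rCopyMapHead CopyMap queues
// carry matching metadata (served/completed/request) for the service
// thread. When a message is consumed, both mirrors recycle in lockstep:
#include <queue>

struct MetaPkg { bool served = false, completed = false; void* request = nullptr; };
struct DataPkg { /* payload buffer elided */ };

void recycleReceivedPair(std::queue<MetaPkg*>& metaInFlight, std::queue<MetaPkg*>& metaFree,
                         std::queue<DataPkg*>& dataInFlight, std::queue<DataPkg*>& dataFree)
{
    MetaPkg* m = metaInFlight.front(); metaInFlight.pop();
    m->served = false; m->completed = false; m->request = nullptr;
    metaFree.push(m);                       // meta record reset for reuse

    DataPkg* d = dataInFlight.front(); dataInFlight.pop();
    dataFree.push(d);                       // payload buffer back to pool
}
// Compare the rcvMetaPackage / rcvPackage pairs in fillBoundaryPull above.
// ----------------------------------------------------------------------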
- - gDst->rCopyMapHead->map[f]->r_con.rcv[dcnt].sz = psize; - gDst->rCopyMapHead->map[f]->r_con.rcv[dcnt].pr = recv_pr[i]; - - BL_ASSERT(gDst->rCopyMapHead->map[f]->r_con.rcv[dcnt].lnd == f); - - if(Perilla::genTags) - { - try{ - std::map::iterator itr = tagMap[recv_pr[i]][gDst->graphID-1][it->dstIndex][it->srcIndex].find(psize); - if( itr != tagMap[recv_pr[i]][gDst->graphID-1][it->dstIndex][it->srcIndex].end()) - { - //gDst->rCopyMapHead->map[f]->r_con.rcv[dcnt].lnd = itr->second; - } - else - { - tagMap[recv_pr[i]][gDst->graphID-1][it->dstIndex][it->srcIndex][psize] = Perilla::uTags++; - //gDst->rCopyMapHead->map[f]->r_con.rcv[dcnt].lnd = Perilla::uTags++; - std::map::iterator itr2 = pTagCnt[recv_pr[i]].find(gDst->graphID-1); - if(itr2 != pTagCnt[recv_pr[i]].end()) - pTagCnt[recv_pr[i]][gDst->graphID-1] = pTagCnt[recv_pr[i]][gDst->graphID-1] + 1; - else - pTagCnt[recv_pr[i]][gDst->graphID-1] = 1; - } - } - catch(std::exception& e) - { - std::cout <<"Inside tagGeneration gID "<< gDst->graphID <<" "<< e.what() << '\n'; - } - } - //tagMap[recv_pr[i]][gDst->graphID][it->dstIndex][it->srcIndex] = pTagCnt[recv_pr[i]]; - - - for(int p=0; pdatabuf[j] = 0; - gDst->rCopyMapHead->map[f]->r_con.rcv[dcnt].pQueue.enqueue(tmpPkg); - } - for(int p=0; prCopyMapHead->map[f]->r_con.rcv[dcnt].recycleQueue.enqueue(gDst->rCopyMapHead->map[f]->r_con.rcv[dcnt].pQueue.dequeue()); - dcnt++; - } - } - } // for(i 1) - //} //if(fg==tg) - } // for(fgraphID > 25) - //std::cout<< "Inside parallel Generating Send partners at tid " << tid << " f " << f << " gID " << gDst->graphID <task[f]->cpAsc_srcHead->l_con.nscpy; i++) - { - int lnd = gSrc->task[f]->cpAsc_srcHead->l_con.scpy[i].nd; - for(int j=0; jtask[ lnd ]->cpAsc_dstHead->l_con.ndcpy; j++) - if(gSrc->task[f]->cpAsc_srcHead->l_con.scpy[i].dbx == gDst->task[ lnd ]->cpAsc_dstHead->l_con.dcpy[j].dbx) - gSrc->task[f]->cpAsc_srcHead->l_con.scpy[i].dPartner = j; - } - } - } // for(fgraphID > 25) - //std::cout<< "Inside parallel Generating Recive partners at tid " << tid << " f " << f << " gID " << gDst->graphID <task[f]->cpAsc_dstHead->l_con.ndcpy; i++) - { - int lns = gDst->task[f]->cpAsc_dstHead->l_con.dcpy[i].ns; - for(int j=0; jtask[ lns ]->cpAsc_srcHead->l_con.nscpy; j++) - if(gDst->task[f]->cpAsc_dstHead->l_con.dcpy[i].dbx == gSrc->task[ lns ]->cpAsc_srcHead->l_con.scpy[j].dbx) - gDst->task[f]->cpAsc_dstHead->l_con.dcpy[i].sPartner = j; - } - } - } // for(fgraphID <<" "<< e.what() << '\n'; -} - - -//std::cout<< "All done safely at gID " << gDst->graphID <assocMF; - // MultiFab* mfSrc = srcGraph->assocMF; - if(nc<1) cout <<"MULTIFAB_COPY_C: nc must be >= 1"<< endl; - if(mfDst->nComp() < (dstcomp-1)) cout <<"MULTIFAB_COPY_C: nc too large for dst multifab"<< endl; - if(mfSrc->nComp() < (srccomp-1)) cout <<"MULTIFAB_COPY_C: nc too large for src multifab"<< endl; - - if(true)//if(!(*mfDst == *mfSrc)) - { - if(ng > mfDst->nGrow()) cout <<"MULTIFAB_COPY_C: ng > 0 not supported in parallel copy"<< endl; - if(ngsrc > mfSrc->nGrow()) cout <<"MULTIFAB_COPY_C: ngsrc > msrc%ng"<< endl; - FabCopyAssoc* cpSrc = srcGraph->task[f]->cpAsc_srcHead; - - //if(srcGraph->graphID==18 && f ==316 && ntid == 0) - //std::cout << "srgG chk see " << srcGraph << " " <graphPartner == destGraph) - break; - cpSrc = cpSrc->next; - } - if(cpSrc == 0) cout <<"Metadata for across grid copy not found"<< endl; - - if(singleT) - { - pthread_mutex_lock(&(cpSrc->l_con.sLock)); - for(int i=0; il_con.nscpy; i++) - { - Package* sndPackage = cpSrc->l_con.scpy[i].recycleQueue.getFront(true); - 
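// ----------------------------------------------------------------------
// [Sketch, not Perilla source] The genTags block above mints point-to-
// point tags from a nested map keyed by (partner rank, graph id, dest
// fab, source fab, message size) plus a running counter (Perilla::uTags),
// so repeated lookups for the same connection reuse one tag. Simplified:
#include <map>

using TagMap =
    std::map<int, std::map<int, std::map<int, std::map<int, std::map<int,int>>>>>;

int lookupOrMintTag(TagMap& tagMap, int rank, int gid, int dstFab, int srcFab,
                    int psize, int& uTags)
{
    auto& bySize = tagMap[rank][gid][dstFab][srcFab];
    auto it = bySize.find(psize);
    if (it != bySize.end())
        return it->second;        // tag already assigned for this message
    bySize[psize] = uTags;        // first sighting: mint a fresh tag
    return uTags++;
}
// The per-rank pTagCnt bookkeeping above just counts how many tags each
// (rank, graph) pair has consumed.
// ----------------------------------------------------------------------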
mfSrc->m_fabs_v[f]->copyToMem(cpSrc->l_con.scpy[i].sbx,srccomp,nc,sndPackage->databuf.local()); - } - for(int i=0;il_con.nscpy; i++) - cpSrc->l_con.scpy[i].pQueue.enqueue(cpSrc->l_con.scpy[i].recycleQueue.dequeue(true),true); - pthread_mutex_unlock(&(cpSrc->l_con.sLock)); - } - else - { - if(ntid == 0) - { - pthread_mutex_lock(&(cpSrc->l_con.sLock)); - //srcGraph->worker[tg]->barr->sync(perilla::NUM_THREADS_PER_TEAM-1); - //if((i%(perilla::NUM_THREADS_PER_TEAM-1)) == ntid) - for(int i=0; il_con.nscpy; i++) - { - Package* sndPackage = cpSrc->l_con.scpy[i].recycleQueue.getFront(true); - mfSrc->m_fabs_v[f]->copyToMem(cpSrc->l_con.scpy[i].sbx,srccomp,nc,sndPackage->databuf.local()); - } - //srcGraph->worker[tg]->barr->sync(perilla::NUM_THREADS_PER_TEAM-1); - //if(ntid==0) - //{ - for(int i=0;il_con.nscpy; i++) - cpSrc->l_con.scpy[i].pQueue.enqueue(cpSrc->l_con.scpy[i].recycleQueue.dequeue(true),true); - pthread_mutex_unlock(&(cpSrc->l_con.sLock)); - } - //srcGraph->worker[tg]->barr->sync(perilla::NUM_THREADS_PER_TEAM-1); - } - - int np = ParallelDescriptor::NProcs(); - if(np == 1) - return; - - //if(myProc==26 && srcGraph->graphID==18 && ntid == 0) - //std::cout << "Notw its sgID 18,"<< f <<" turn lets see " << cpSrc->r_con.nsnd <graphID==18 && ntid == 0) - //std::cout << "Notw its sgID 18,"<< f <<" turn lets see " << cpSrc->r_con.nsnd <graphID==18 && f ==316) - //BL_ASSERT(cpSrc->r_con.nsnd == 177); - - if(singleT) - { - pthread_mutex_lock(&(cpSrc->r_con.sndLock)); - for(int i=0; ir_con.nsnd; i++) - { - - Package* sndPackage = cpSrc->r_con.snd[i].recycleQueue.dequeue(true); - mfSrc->m_fabs_v[f]->copyToMem(cpSrc->r_con.snd[i].sbx,srccomp,nc,sndPackage->databuf.local()); - cpSrc->r_con.snd[i].pQueue.enqueue(sndPackage,true); - } - - pthread_mutex_unlock(&(cpSrc->r_con.sndLock)); - - cpSrc->r_con.remotePushReady = true; - ///* - pthread_mutex_lock(&(srcGraph->sCopyMapHead->map[f]->r_con.sndLock)); - for(int i=0; ir_con.nsnd; i++) - srcGraph->sCopyMapHead->map[f]->r_con.snd[i].pQueue.enqueue(srcGraph->sCopyMapHead->map[f]->r_con.snd[i].recycleQueue.dequeue(true),true); - pthread_mutex_unlock(&(srcGraph->sCopyMapHead->map[f]->r_con.sndLock)); - } - else - { - if(ntid == 0) - { - pthread_mutex_lock(&(cpSrc->r_con.sndLock)); - //srcGraph->worker[tg]->barr->sync(perilla::NUM_THREADS_PER_TEAM-1); - - //if((i%(perilla::NUM_THREADS_PER_TEAM-1)) == ntid) - for(int i=0; ir_con.nsnd; i++) - { - - // if(myProc==4 && srcGraph->graphID==2 && (f ==0 || f ==2)) - //std::cout << " Pushing 2 316 164"<r_con.snd[i].recycleQueue.dequeue(true); - mfSrc->m_fabs_v[f]->copyToMem(cpSrc->r_con.snd[i].sbx,srccomp,nc,sndPackage->databuf.local()); - cpSrc->r_con.snd[i].pQueue.enqueue(sndPackage,true); - - } - - //srcGraph->worker[tg]->barr->sync(perilla::NUM_THREADS_PER_TEAM-1); - //if(ntid==0) - //{ - pthread_mutex_unlock(&(cpSrc->r_con.sndLock)); - - cpSrc->r_con.remotePushReady = true; - ///* - pthread_mutex_lock(&(srcGraph->sCopyMapHead->map[f]->r_con.sndLock)); - for(int i=0; ir_con.nsnd; i++) - srcGraph->sCopyMapHead->map[f]->r_con.snd[i].pQueue.enqueue(srcGraph->sCopyMapHead->map[f]->r_con.snd[i].recycleQueue.dequeue(true),true); - pthread_mutex_unlock(&(srcGraph->sCopyMapHead->map[f]->r_con.sndLock)); - //*/ - } - //srcGraph->worker[tg]->barr->sync(perilla::NUM_THREADS_PER_TEAM-1); - } - } // if(!(*mfDst == *mfSrc)) -} // multifabCopyPushAsync - - -void Perilla::multifabCopyPull(RegionGraph* destGraph, RegionGraph* srcGraph, MultiFab* mfDst, MultiFab* mfSrc, int f, int dstcomp, int srccomp, int nc, int ng, int ngsrc, 
bool singleT) -{ - int myProc = ParallelDescriptor::MyProc(); - - int ntid = WorkerThread::perilla_wtid(); - int tg = WorkerThread::perilla_wid(); - //MultiFab* mfDst = destGraph->assocMF; - //MultiFab* mfSrc = srcGraph->assocMF; - if(nc<1) cout <<"MULTIFAB_COPY_C: nc must be >= 1"<< endl; - if(mfDst->nComp() < (dstcomp-1)) cout <<"MULTIFAB_COPY_C: nc too large for dst multifab"<< endl; - //if(mfSrc->nComp() < (srccomp-1)) cout <<"MULTIFAB_COPY_C: nc too large for src multifab"<< endl; - - if(true)//if(!(*mfDst == *mfSrc)) - { - if(ng > mfDst->nGrow()) cout <<"MULTIFAB_COPY_C: ng > 0 not supported in parallel copy"<< endl; - //if(ngsrc > mfSrc->nGrow()) cout <<"MULTIFAB_COPY_C: ngsrc > msrc%ng"<< endl; - FabCopyAssoc* cpDst = destGraph->task[f]->cpAsc_dstHead; - while(cpDst != 0) - { - if(cpDst->graphPartner == srcGraph) - break; - cpDst = cpDst->next; - } - if(cpDst == 0) cout <<"Metadata for across grid copy not found"<< endl; - //destGraph->worker[tg]->barr->sync(perilla::NUM_THREADS_PER_TEAM-1); - - if(singleT) - { - pthread_mutex_lock(&(cpDst->l_con.dLock)); - for(int i=0; il_con.ndcpy; i++) - { - Package* rcvPackage = cpDst->l_con.dcpy[i].pQueue.getFront(true); // corrected from recycleQ to pQ - mfDst->m_fabs_v[f]->copyFromMem(cpDst->l_con.dcpy[i].dbx,dstcomp,nc,rcvPackage->databuf.local()); - } - for(int i=0; il_con.ndcpy; i++) - cpDst->l_con.dcpy[i].recycleQueue.enqueue(cpDst->l_con.dcpy[i].pQueue.dequeue(true),true); // corrected from pQ to recycleQ and from recycleQ to pQ - cpDst->l_con.firingRuleCnt = cpDst->l_con.firingRuleCnt - cpDst->l_con.ndcpy; - pthread_mutex_unlock(&(cpDst->l_con.dLock)); - } - else - { - if(ntid==0) - { - pthread_mutex_lock(&(cpDst->l_con.dLock)); - //destGraph->worker[tg]->barr->sync(perilla::NUM_THREADS_PER_TEAM-1); - - //if((i%(perilla::NUM_THREADS_PER_TEAM-1)) == ntid) - for(int i=0; il_con.ndcpy; i++) - { - Package* rcvPackage = cpDst->l_con.dcpy[i].pQueue.getFront(true); // corrected from recycleQ to pQ - mfDst->m_fabs_v[f]->copyFromMem(cpDst->l_con.dcpy[i].dbx,dstcomp,nc,rcvPackage->databuf.local()); - } - //destGraph->worker[tg]->barr->sync(perilla::NUM_THREADS_PER_TEAM-1); - - //if(ntid == 0) - //{ - for(int i=0; il_con.ndcpy; i++) - cpDst->l_con.dcpy[i].recycleQueue.enqueue(cpDst->l_con.dcpy[i].pQueue.dequeue(true),true); // corrected from pQ to recycleQ and from recycleQ to pQ - cpDst->l_con.firingRuleCnt = cpDst->l_con.firingRuleCnt - cpDst->l_con.ndcpy; - pthread_mutex_unlock(&(cpDst->l_con.dLock)); - } - //destGraph->worker[tg]->barr->sync(perilla::NUM_THREADS_PER_TEAM-1); - } - - int np = ParallelDescriptor::NProcs(); - if(np == 1) - return; - - if(singleT) - { - //pthread_mutex_lock(&(destGraph->rCopyMapHead->map[f]->r_con.rcvLock)); - pthread_mutex_lock(&(cpDst->r_con.rcvLock)); - for(int i=0; ir_con.nrcv; i++) - { - ///* - //Package *rcvMetaPackage = destGraph->rCopyMapHead->map[f]->r_con.rcv[i].pQueue.dequeue(true); - Package* rcvPackage = cpDst->r_con.rcv[i].pQueue.dequeue(true); - mfDst->m_fabs_v[f]->copyFromMem(cpDst->r_con.rcv[i].dbx,dstcomp,nc,rcvPackage->databuf.local()); - rcvPackage->completed = false; - rcvPackage->served = false; - rcvPackage->request = 0; - cpDst->r_con.rcv[i].recycleQueue.enqueue(rcvPackage, true); - //destGraph->rCopyMapHead->map[f]->r_con.rcv[i].recycleQueue.enqueue(rcvMetaPackage,true); - - //Package* rcvPackage = cpDst->r_con.rcv[i].pQueue.dequeue(true); // corrected from recycleQ to pQ - //rcvPackage->completed = false; - //cpDst->r_con.rcv[i].recycleQueue.enqueue(rcvPackage,true); // corrected from pQ 
to recycleQ - //*/ - - //Package* rcvPackage = cpDst->r_con.rcv[i].pQueue.getFront(true); // corrected from recycleQ to pQ - //mfDst->m_fabs_v[f]->copyFromMem(cpDst->r_con.rcv[i].dbx,dstcomp,nc,rcvPackage->databuf); - } - cpDst->r_con.firingRuleCnt = cpDst->r_con.firingRuleCnt - cpDst->r_con.nrcv; - - cpDst->r_con.remotePullDone = true; - ///* - for(int i=0; ir_con.nrcv; i++) - if(cpDst->r_con.rcv[i].pQueue.queueSize(true) >= 1) - if(cpDst->r_con.rcv[i].pQueue.getFront(true)->checkRequest()) - cpDst->r_con.firingRuleCnt++; - //*/ - pthread_mutex_unlock(&(cpDst->r_con.rcvLock)); - //pthread_mutex_unlock(&(destGraph->rCopyMapHead->map[f]->r_con.rcvLock)); - - } - else - { - if(ntid==0) - { - //pthread_mutex_lock(&(destGraph->rCopyMapHead->map[f]->r_con.rcvLock)); - pthread_mutex_lock(&(cpDst->r_con.rcvLock)); - //} - //destGraph->worker[tg]->barr->sync(perilla::NUM_THREADS_PER_TEAM-1); - - //if((i%(perilla::NUM_THREADS_PER_TEAM-1)) == ntid) - for(int i=0; ir_con.nrcv; i++) - { - ///* - //Package *rcvMetaPackage = destGraph->rCopyMapHead->map[f]->r_con.rcv[i].pQueue.dequeue(true); - Package* rcvPackage = cpDst->r_con.rcv[i].pQueue.dequeue(true); - mfDst->m_fabs_v[f]->copyFromMem(cpDst->r_con.rcv[i].dbx,dstcomp,nc,rcvPackage->databuf.local()); - rcvPackage->completed = false; - rcvPackage->served = false; - rcvPackage->request = 0; - cpDst->r_con.rcv[i].recycleQueue.enqueue(rcvPackage, true); - //destGraph->rCopyMapHead->map[f]->r_con.rcv[i].recycleQueue.enqueue(rcvMetaPackage,true); - - //Package* rcvPackage = cpDst->r_con.rcv[i].pQueue.dequeue(true); // corrected from recycleQ to pQ - //rcvPackage->completed = false; - //cpDst->r_con.rcv[i].recycleQueue.enqueue(rcvPackage,true); // corrected from pQ to recycleQ - //*/ - - //Package* rcvPackage = cpDst->r_con.rcv[i].pQueue.getFront(true); // corrected from recycleQ to pQ - //mfDst->m_fabs_v[f]->copyFromMem(cpDst->r_con.rcv[i].dbx,dstcomp,nc,rcvPackage->databuf); - - } - //destGraph->worker[tg]->barr->sync(perilla::NUM_THREADS_PER_TEAM-1); - - //if(ntid==0) - //{ - cpDst->r_con.firingRuleCnt = cpDst->r_con.firingRuleCnt - cpDst->r_con.nrcv; - - cpDst->r_con.remotePullDone = true; - ///* - for(int i=0; ir_con.nrcv; i++) - if(cpDst->r_con.rcv[i].pQueue.queueSize(true) >= 1) - if(cpDst->r_con.rcv[i].pQueue.getFront(true)->checkRequest()) - cpDst->r_con.firingRuleCnt++; - //*/ - pthread_mutex_unlock(&(cpDst->r_con.rcvLock)); - //pthread_mutex_unlock(&(destGraph->rCopyMapHead->map[f]->r_con.rcvLock)); - } - //destGraph->worker[tg]->barr->sync(perilla::NUM_THREADS_PER_TEAM-1); - } - } // if(!(*mfDst == *mfSrc)) - -} // multifabCopyPull - -void Perilla::multifabCopyPull(RegionGraph* destGraph, RegionGraph* srcGraph, MultiFab* mfDst, MultiFab* mfSrc, int f, bool singleT) -{ - multifabCopyPull(destGraph, srcGraph, mfDst, mfSrc, f, 1, 1, 1, 0, 0,singleT); -} - - -void Perilla::serviceLocalGridCopyRequests(std::vector graphArray, int g, int tg) -{ - int nfabs = graphArray[g]->numTasks; - for(int f=0; ftask[f]->cpAsc_srcHead; - while(cpSrc != 0) - { - bool anyReq=false; - for(int i=0; il_con.nscpy; i++) - if(cpSrc->l_con.scpy[i].pQueue.queueSize(true)>0){ - anyReq=true; - break; - } - if(anyReq) - { - pthread_mutex_lock(&(cpSrc->l_con.sLock)); - for(int i=0; il_con.nscpy; i++) - { - if(cpSrc->l_con.scpy[i].pQueue.queueSize(true)>0) - { - FabCopyAssoc* cpDst = cpSrc->graphPartner->task[cpSrc->l_con.scpy[i].nd]->cpAsc_dstHead; - while(cpDst != 0) - { - if(cpDst->graphPartner == graphArray[g]) - break; - cpDst = cpDst->next; - } - Package* sPackage = 
cpSrc->l_con.scpy[i].pQueue.dequeue(true); - pthread_mutex_lock(&(cpDst->l_con.dLock)); - int dPartner = cpSrc->l_con.scpy[i].dPartner; - Package* dPackage = cpDst->l_con.dcpy[dPartner].recycleQueue.dequeue(true); - std::memcpy(dPackage->databuf.local(), sPackage->databuf.local(), dPackage->bufSize * sizeof(double)); - cpDst->l_con.dcpy[dPartner].pQueue.enqueue(dPackage,true); - if(cpDst->l_con.dcpy[dPartner].pQueue.queueSize(true) == 1) - cpDst->l_con.firingRuleCnt++; - pthread_mutex_unlock(&(cpDst->l_con.dLock)); - cpSrc->l_con.scpy[i].recycleQueue.enqueue(sPackage,true); - } - } // for - pthread_mutex_unlock(&(cpSrc->l_con.sLock)); - }//anyReq - cpSrc = cpSrc->next; - } // while(cpSrc != 0) - } // if(tg==fg) - } // for(f graphArray, int g, int nGraphs, int tg) -{ - bool nextsReq, nextrReq; - int np = ParallelDescriptor::NProcs(); - int myProc = ParallelDescriptor::MyProc(); - int numfabs = graphArray[g]->numTasks; - int graphID = graphArray[g]->graphID; - - for(int f=0; ftask[f]->cpAsc_dstHead; - while(cpDst != 0) - { - //if(pthread_mutex_trylock(&(graphArray[g]->rCopyMapHead->map[f]->r_con.rcvLock)) != 0) - { - //if(pthread_mutex_trylock(&(cpDst->r_con.rcvLock)) != 0) - { - for(int i=0; ir_con.nrcv; i++) - { - if(cpDst->r_con.rcv[i].pQueue.queueSize(true)==0) - { - nextrReq = true; - } - else - { - Package *rearPackage = cpDst->r_con.rcv[i].pQueue.getRear(true); - // Also check the recycle queue because when rear is completed it may cause unlimited recv posts - if(rearPackage->completed && cpDst->r_con.rcv[i].pQueue.queueSize(true) == 1) //!latest receive request has been completed - { - nextrReq = true; - } - else //!expected message is still on the way - nextrReq = false; - } - if(nextrReq) //!take a message from recycle pool and post a receive - { - //!create a package to keep track of receive requests - pthread_mutex_lock(&(cpDst->r_con.rcvLock)); - //Package *rMetaPackage = graphArray[g]->rCopyMapHead->map[f]->r_con.rcv[i].recycleQueue.dequeue(true); - //!extract a package from the recycle pool at the destination NUMA node to buffer incoming data - int ns = graphArray[g]->rCopyMapHead->map[f]->r_con.rcv[i].ns; - int nd = graphArray[g]->rCopyMapHead->map[f]->r_con.rcv[i].nd; - int lnd = graphArray[g]->rCopyMapHead->map[f]->r_con.rcv[i].lnd; - int r_grids = graphArray[g]->rCopyMapHead->map[f]->r_con.rcv[i].r_grids; - Package *rPackage = cpDst->r_con.rcv[i].recycleQueue.dequeue(true); - int tag = tagMap[graphArray[g]->rCopyMapHead->map[f]->r_con.rcv[i].pr][g][nd][ns][graphArray[g]->rCopyMapHead->map[f]->r_con.rcv[i].sz]; - - rPackage->request = new future<>; - rPackage->completed=false; - rPackage->tag = tag; - cpDst->r_con.rcv[i].pQueue.enqueue(rPackage,true); //!this is not done yet - //graphArray[g]->rCopyMapHead->map[f]->r_con.rcv[i].pQueue.enqueue(rMetaPackage,true); //!this is not done yet - - pthread_mutex_lock(&(rMsgMap.lock)); - rMsgMap.map[graphArray[g]->rCopyMapHead->map[f]->r_con.rcv[i].pr][tag].push_back(rPackage); - rMsgMap.size++; - pthread_mutex_unlock(&(rMsgMap.lock)); - pthread_mutex_unlock(&(cpDst->r_con.rcvLock)); - } - } // for (ir_con.nrcv) - //pthread_mutex_unlock(&(cpDst->r_con.rcvLock)); - } // if(ga locked) - //pthread_mutex_unlock(&(graphArray[g]->rCopyMapHead->map[f]->r_con.rcvLock)); - } // if(mf locked) - cpDst = cpDst->next; - } // while(cpDst != 0) - } // for(ftask[f]->cpAsc_srcHead; - while(cpSrc != 0) - { - for(int i=0; ir_con.nsnd; i++) - { - //if(graphArray[g]->sCopyMapHead->map[f]->r_con.snd[i].pQueue.queueSize(true) == 0) //!no message has been 
received or all received messages have been claimed - if(cpSrc->r_con.snd[i].pQueue.queueSize(true) == 0) - nextrReq = false; - else - nextrReq = true; - - if(nextrReq) //!take a message from recycle pool and post a receive - { - //Package *sMetaPackage = graphArray[g]->sCopyMapHead->map[f]->r_con.snd[i].pQueue.getFront(true); - Package *sPackage = cpSrc->r_con.snd[i].pQueue.getFront(true); - if(!sPackage->served) - { - sPackage->completed = false; - sPackage->served = true; - //sMetaPackage->request = new future<>; - int ns = graphArray[g]->sCopyMapHead->map[f]->r_con.snd[i].ns; - int nd = graphArray[g]->sCopyMapHead->map[f]->r_con.snd[i].nd; - int r_gid = graphArray[g]->sCopyMapHead->map[f]->r_con.snd[i].r_gid; - int r_grids = graphArray[g]->sCopyMapHead->map[f]->r_con.snd[i].r_grids; - //int tag = tagGen(ns, nd, r_gid-1, np*r_grids, nGraphs); - int tag = Perilla::myTagMap[r_gid][nd][ns][graphArray[g]->sCopyMapHead->map[f]->r_con.snd[i].sz]; - int src= upcxx::rank_me(); - int dst= graphArray[g]->sCopyMapHead->map[f]->r_con.snd[i].pr; - int size= graphArray[g]->sCopyMapHead->map[f]->r_con.snd[i].sz; - - //sPackage->request = new future<>; - pthread_mutex_lock(&(sMsgMap.lock)); - sMsgMap.map[dst][tag].push_back(sPackage); - sMsgMap.size++; - pthread_mutex_unlock(&(sMsgMap.lock)); - upcxx::global_ptr sbuf= sPackage->databuf; //static_cast >((double*)sPackage->databuf); - - upcxx::rpc(dst, - [=](){ - //at destination rank, look up recv buffer and pull remote data and store data in the buffer - bool posted_recv=false; - double* localbuf= NULL; - pthread_mutex_lock(&(rMsgMap.lock)); - if(rMsgMap.map.find(src) != rMsgMap.map.end()){ - if(rMsgMap.map[src].find(tag) != rMsgMap.map[src].end()) - if(rMsgMap.map[src][tag].size() >0){ - posted_recv=true; - localbuf= (rMsgMap.map[src][tag].front()->databuf).local();//(double*) (static_cast > (rMsgMap.map[src][tag].front()->databuf).local()); - rMsgMap.map[src][tag].front()->tag= tag; - if(localbuf){ - *(rMsgMap.map[src][tag].front()->request)= upcxx::rget(sbuf, localbuf, size); - rMsgMap.map[src][tag].pop_front(); - rMsgMap.size--; - } - } - } - pthread_mutex_unlock(&(rMsgMap.lock)); - //save pull request for later when recv buffer is posted - if(posted_recv==false){ - getReq_t *req= new getReq_t(src, tag, sbuf, size); - pendingGetList.add(req); - } - //store send request to notify sender later upon completion - //sFutureMap[fu]= sMetaPackage->request; - } - ); - } //served - }//nextReq - } // for (ir_con.nsnd) - cpSrc = cpSrc->next; - } // while(cpSrc != 0) - } // for(ftask[f]->cpAsc_dstHead; - while(cpDst != 0) - { - for(int i=0; ir_con.nrcv; i++) - { - //if(graphArray[g]->rCopyMapHead->map[f]->r_con.rcv[i].pQueue.queueSize(true) > 0) //!all messages before rear have completed - if(cpDst->r_con.rcv[i].pQueue.queueSize(true) > 0) - { - //if(pthread_mutex_trylock(&(cpDst->r_con.rcvLock)) != 0) - { - Package *rearPackage = cpDst->r_con.rcv[i].pQueue.getRear(true); //graphArray[g]->rCopyMapHead->map[f]->r_con.rcv[i].pQueue.getRear(true); - if(!rearPackage->completed) - { - if(rearPackage->request->ready()) - { - pthread_mutex_lock(&(cpDst->r_con.rcvLock)); - int ns = graphArray[g]->rCopyMapHead->map[f]->r_con.rcv[i].ns; - int nd = graphArray[g]->rCopyMapHead->map[f]->r_con.rcv[i].nd; - int lnd = graphArray[g]->rCopyMapHead->map[f]->r_con.rcv[i].lnd; - int r_grids = graphArray[g]->rCopyMapHead->map[f]->r_con.rcv[i].r_grids; - int tag = rearPackage->tag; - //int tag = 
tagMap[graphArray[g]->rCopyMapHead->map[f]->r_con.rcv[i].pr][g][nd][ns][graphArray[g]->rCopyMapHead->map[f]->r_con.rcv[i].sz]; - int dst = upcxx::rank_me(); - int src= graphArray[g]->rCopyMapHead->map[f]->r_con.rcv[i].pr; - upcxx::rpc(src, - [=](){ - pthread_mutex_lock(&(sMsgMap.lock)); - //upcxx::future<> *ft= sMsgMap.map[dst][tag].front()->request; - //delete ft;//so that sender know - sMsgMap.map[dst][tag].front()->completed = true; - sMsgMap.map[dst][tag].pop_front(); - sMsgMap.size--; - pthread_mutex_unlock(&(sMsgMap.lock)); - } - ); - - delete rearPackage->request; - rearPackage->completed=true; - //cpDst->r_con.rcv[i].pQueue.getRear()->completeRequest(); - //graphArray[g]->rCopyMapHead->map[f]->r_con.rcv[i].pQueue.getRear()->completeRequest(); - - //if(graphArray[g]->rCopyMapHead->map[f]->r_con.rcv[i].pQueue.queueSize(true) == 1) - if(cpDst->r_con.rcv[i].pQueue.queueSize(true) == 1) - { - cpDst->r_con.firingRuleCnt++; - } - pthread_mutex_unlock(&(cpDst->r_con.rcvLock)); - } - } - //pthread_mutex_unlock(&(cpDst->r_con.rcvLock)); - } // if(ga locked) - } // if(pQueue.queueSize(true) > 0) - } // for (ir_con.nrcv) - cpDst = cpDst->next; - } // while(cpDst != 0) - } // for(ftask[f]->cpAsc_srcHead; - while(cpSrc != 0) - { - for(int i=0; ir_con.nsnd; i++) - { - //if(graphArray[g]->sCopyMapHead->map[f]->r_con.snd[i].pQueue.queueSize(true) > 0) - if(cpSrc->r_con.snd[i].pQueue.queueSize(true) >0) - { - //Package *frontPackage = graphArray[g]->sCopyMapHead->map[f]->r_con.snd[i].pQueue.getFront(true); - Package *frontPackage = cpSrc->r_con.snd[i].pQueue.getFront(true); - if(frontPackage->served /*&& !frontPackage->completed*/) //!latest receive request has NOT been completed - { - bool flag = false; - int ret_flag; - //if(frontPackage->request==NULL)//data have been received by receiver - if(frontPackage->completed)//data have been received by receiver - { -/* - pthread_mutex_lock(&(graphArray[g]->sCopyMapHead->map[f]->r_con.sndLock)); - frontPackage = graphArray[g]->sCopyMapHead->map[f]->r_con.snd[i].pQueue.dequeue(true); - frontPackage->completed = false; - frontPackage->served = false; - frontPackage->request = 0; - frontPackage->tag = 0; - graphArray[g]->sCopyMapHead->map[f]->r_con.snd[i].recycleQueue.enqueue(frontPackage,true); - pthread_mutex_unlock(&(graphArray[g]->sCopyMapHead->map[f]->r_con.sndLock)); -*/ - - pthread_mutex_lock(&(cpSrc->r_con.sndLock)); - frontPackage = cpSrc->r_con.snd[i].pQueue.dequeue(true); - frontPackage->completed = false; - frontPackage->served = false; - frontPackage->request = 0; - frontPackage->tag = 0; - cpSrc->r_con.snd[i].recycleQueue.enqueue(frontPackage,true); - pthread_mutex_unlock(&(cpSrc->r_con.sndLock)); - } - } - } // if(queueSize > 0) - } // for (ir_con.nsnd) - cpSrc = cpSrc->next; - } // while(cpSrc != 0) - } // for(f graphArray, int g, int nGraphs, int tg) -{ - int np = ParallelDescriptor::NProcs(); - int myProc = ParallelDescriptor::MyProc(); - int numfabs = graphArray[g]->numTasks; - //MultiFab* mf = graphArray[g]->assocMF; - int graphID = graphArray[g]->graphID; - - for(int f=0; ftask[f]->cpAsc_srcHead; - while(cpSrc != 0) - { - if(cpSrc->r_con.remotePushReady) - { - pthread_mutex_lock(&(graphArray[g]->sCopyMapHead->map[f]->r_con.sndLock)); - for(int i=0; ir_con.nsnd; i++) - { - graphArray[g]->sCopyMapHead->map[f]->r_con.snd[i].pQueue.enqueue(graphArray[g]->sCopyMapHead->map[f]->r_con.snd[i].recycleQueue.dequeue(true),true); - } - pthread_mutex_unlock(&(graphArray[g]->sCopyMapHead->map[f]->r_con.sndLock)); - cpSrc->r_con.remotePushReady = 
false; - }// if remotepushready - cpSrc = cpSrc->next; - } - }// ismyRegion - }//for ftask[f]->cpAsc_dstHead; - while(cpDst != 0) - { - if(pthread_mutex_trylock(&(graphArray[g]->rCopyMapHead->map[f]->r_con.rcvLock)) != 0) - { - if(pthread_mutex_trylock(&(cpDst->r_con.rcvLock)) != 0) - { - //if(f==1 && g==26 && myProc == 54) - //std::cout<<"Completing Push f " << f << " gID " << g+1 << " myP " << myProc << " PDone "<< cpDst->r_con.remotePullDone <r_con.remotePullDone) - { - for(int i=0; ir_con.nrcv; i++) - { - - Package *rcvMetaPackage = graphArray[g]->rCopyMapHead->map[f]->r_con.rcv[i].pQueue.dequeue(true); - rcvMetaPackage->completed = false; - rcvMetaPackage->served = false; - rcvMetaPackage->request = 0; - graphArray[g]->rCopyMapHead->map[f]->r_con.rcv[i].recycleQueue.enqueue(rcvMetaPackage,true); - - Package* rcvPackage = cpDst->r_con.rcv[i].pQueue.dequeue(true); // corrected from recycleQ to pQ - rcvPackage->completed = false; - cpDst->r_con.rcv[i].recycleQueue.enqueue(rcvPackage,true); // corrected from pQ to recycleQ - - //cpDst->r_con.firingRuleCnt = cpDst->r_con.firingRuleCnt - 1; - - if(cpDst->r_con.rcv[i].pQueue.queueSize(true) >= 1) - if(cpDst->r_con.rcv[i].pQueue.getFront(true)->checkRequest()) - cpDst->r_con.firingRuleCnt++; - - - } // for (ir_con.nrcv) - - cpDst->r_con.remotePullDone = false; - - //if(f==1 && g==26 && myProc == 54) - // std::cout<<"Completed Push f " << f << " gID " << g+1 << " myP " << myProc << " PDone "<< cpDst->r_con.remotePullDone <r_con.rcvLock)); - } // if(ga locked) - pthread_mutex_unlock(&(graphArray[g]->rCopyMapHead->map[f]->r_con.rcvLock)); - } // if(mf locked) - cpDst = cpDst->next; - } // while(cpDst != 0) - /* - if(false) - for(int id=0; idtask[f]->depTaskIDs.size(); id++) - { - int df = graphArray[g]->task[f]->depTaskIDs[id]; - if(WorkerThread::isMyRegion(0,df)) - { - int lgID = graphArray[g]->srcLinkGraph->graphID-1; - - //if(f==1 && g==26 && myProc == 54) - //std::cout<<"Completing Dep Push f " << df << " gID " << lgID+1 << " myP " << myProc <task[df]->cpAsc_dstHead; - while(cpdDst != 0) - { - if(omp_test_lock(graphArray[lgID]->rCopyMapHead->map[df]->r_con.rcvLock) != 0) - { - if(omp_test_lock(cpdDst->r_con.rcvLock) != 0) - { - //if(f==1 && g==26 && myProc == 54) - //std::cout<<"Completing Push f " << f << " gID " << g+1 << " myP " << myProc << " PDone "<< cpdDst->r_con.remotePullDone <r_con.remotePullDone) - { - for(int i=0; ir_con.nrcv; i++) - { - - Package *rcvMetaPackage = graphArray[lgID]->rCopyMapHead->map[df]->r_con.rcv[i].pQueue.dequeue(true); - rcvMetaPackage->completed = false; - rcvMetaPackage->served = false; - rcvMetaPackage->request = MPI_REQUEST_NULL; - graphArray[lgID]->rCopyMapHead->map[df]->r_con.rcv[i].recycleQueue.enqueue(rcvMetaPackage,true); - - Package* rcvPackage = cpdDst->r_con.rcv[i].pQueue.dequeue(true); // corrected from recycleQ to pQ - rcvPackage->completed = false; - cpdDst->r_con.rcv[i].recycleQueue.enqueue(rcvPackage,true); // corrected from pQ to recycleQ - - //cpdDst->r_con.firingRuleCnt = cpdDst->r_con.firingRuleCnt - 1; - - if(cpdDst->r_con.rcv[i].pQueue.queueSize(true) >= 1) - if(cpdDst->r_con.rcv[i].pQueue.getFront(true)->checkRequest()) - cpdDst->r_con.firingRuleCnt++; - - - } // for (ir_con.nrcv) - - cpdDst->r_con.remotePullDone = false; - - //if(df==10 && lgID==24 && myProc == 54) - // std::cout<<"Completed Push f " << df << " gID " << lgID+1 << " myP " << myProc << " PDone "<< cpdDst->r_con.remotePullDone <r_con.rcvLock); - } // if(ga locked) - 
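// [Editorial note] A semantics hazard in the locking above: the live code
// tests `if(pthread_mutex_trylock(&m) != 0)` before entering the guarded
// section, but pthread_mutex_trylock() returns 0 on SUCCESS and non-zero
// (EBUSY) on failure -- the opposite convention of the omp_test_lock()
// calls still visible in this disabled block, which return non-zero when
// the lock is acquired. As written, the pthread version enters the
// critical section exactly when the lock was NOT obtained and later
// unlocks a mutex it never locked. A faithful port would be:
//
//     if (pthread_mutex_trylock(&m) == 0) {   // 0 == acquired
//         ... guarded work ...
//         pthread_mutex_unlock(&m);
//     }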
omp_unset_lock(graphArray[lgID]->rCopyMapHead->map[df]->r_con.rcvLock); - } // if(mf locked) - cpdDst = cpdDst->next; - } // while(cpdDst != 0) - - - } // if tg==0 region - - - } // for all dependents - */ - - - - } - } // for(f= 1"<< endl; - if(mfDst->nComp() < (dstcomp-1)) cout <<"MULTIFAB_COPY_C: nc too large for dst multifab"<< endl; - if(mfSrc->nComp() < (srccomp-1)) cout <<"MULTIFAB_COPY_C: nc too large for src multifab"<< endl; - - //mTeams = false; - -// if(np==1) - //multifabCopyPush_1Team(destGraph,srcGraph,mfDst,mfSrc,f,dstcomp,srccomp,nc,ng,ngsrc,singleT); -/* else if(mTeams) - { - if(WorkerThread::isLocPPTID(tid)) - multifabCopyLocPush(destGraph,srcGraph,mfDst,mfSrc,f,tid,dstcomp,srccomp,nc,ng,ngsrc); - else - multifabCopyRmtPush(destGraph,srcGraph,mfDst,mfSrc,f,tid,dstcomp,srccomp,nc,ng,ngsrc); - } - else - multifabCopyPush_1Team(destGraph,srcGraph,mfDst,mfSrc,f,tid,dstcomp,srccomp,nc,ng,ngsrc,singleT); -*/ - - multifabCopyPush_1Team(destGraph,srcGraph,mfDst,mfSrc,f,dstcomp,srccomp,nc,ng,ngsrc,singleT); - //if(!singleT) - //srcGraph->worker[perilla::wid()]->barr->sync(perilla::NUM_THREADS_PER_TEAM-perilla::NUM_COMM_THREADS); - - //double end_time_wtime = omp_get_wtime(); - //if(ntid==0) - //Perilla::getPPPTimeSplit[2] += end_time_wtime - start_time_wtime; -} - - void Perilla::multifabCopyPush_1Team(RegionGraph* destGraph, RegionGraph* srcGraph, amrex::MultiFab* mfDst, amrex::MultiFab* mfSrc, int f, int dstcomp, int srccomp, int nc, int ng, int ngsrc, bool singleT) - { - int ntid = perilla::wtid();// - perilla::NUM_COMM_THREADS; - int tg = perilla::wid(); - int myProc = amrex::ParallelDescriptor::MyProc(); - - if(true)//if(!(*mfDst == *mfSrc)) - { - if(ng > mfDst->nGrow()) cout <<"MULTIFAB_COPY_C: ng > 0 not supported in parallel copy"<< endl; - if(ngsrc > mfSrc->nGrow()) cout <<"MULTIFAB_COPY_C: ngsrc > msrc%ng"<< endl; - FabCopyAssoc* cpSrc = srcGraph->task[f]->cpAsc_srcHead; - - while(cpSrc != 0) - { - if(cpSrc->graphPartner == destGraph) - break; - cpSrc = cpSrc->next; - } - if(cpSrc == 0) cout <<"Metadata for across grid copy not found"<< endl; - - if(singleT) - { - pthread_mutex_lock(&(cpSrc->l_con.sLock)); - for(int i=0; il_con.nscpy; i++) - { - Package* sndPackage = cpSrc->l_con.scpy[i].recycleQueue.getFront(true); - mfSrc->m_fabs_v[f]->copyToMem(cpSrc->l_con.scpy[i].sbx,srccomp,nc,sndPackage->databuf.local()); - } - for(int i=0;il_con.nscpy; i++) - cpSrc->l_con.scpy[i].pQueue.enqueue(cpSrc->l_con.scpy[i].recycleQueue.dequeue(true),true); - pthread_mutex_unlock(&(cpSrc->l_con.sLock)); - } - else - { - if(ntid == 0) - { - pthread_mutex_lock(&(cpSrc->l_con.sLock)); - //srcGraph->worker[tg]->barr->sync(perilla::NUM_THREADS_PER_TEAM-perilla::NUM_COMM_THREADS); - //std::ofstream fout; - //fout.open(std::to_string(myProc)+ "_" + std::to_string(tid) + ".txt", std::fstream::app); - //if((i%(perilla::NUM_THREADS_PER_TEAM-perilla::NUM_COMM_THREADS)) == ntid) - for(int i=0; il_con.nscpy; i++) - { - Package* sndPackage = cpSrc->l_con.scpy[i].recycleQueue.getFront(true); - mfSrc->m_fabs_v[f]->copyToMem(cpSrc->l_con.scpy[i].sbx,srccomp,nc,sndPackage->databuf.local()); - /* - for(int ii=0; ii < sndPackage->bufSize; ii++) - if(sndPackage->databuf[ii] == 0) - fout << "MFCPush loc zero at " << f << " i " << i << " ii " << ii << " sbx "<< cpSrc->l_con.scpy[i].sbx << std::endl; - */ - } - - //fout.close(); - - //srcGraph->worker[tg]->barr->sync(perilla::NUM_THREADS_PER_TEAM-perilla::NUM_COMM_THREADS); - //if(ntid==0) - //{ - for(int i=0;il_con.nscpy; i++) - 
cpSrc->l_con.scpy[i].pQueue.enqueue(cpSrc->l_con.scpy[i].recycleQueue.dequeue(true),true); - pthread_mutex_unlock(&(cpSrc->l_con.sLock)); - } - //srcGraph->worker[tg]->barr->sync(perilla::NUM_THREADS_PER_TEAM-perilla::NUM_COMM_THREADS); - } - - int np = amrex::ParallelDescriptor::NProcs(); - if(np == 1) - return; - - //if(myProc==26 && srcGraph->graphID==18 && ntid == 0) - //std::cout << "Notw its sgID 18,"<< f <<" turn lets see " << cpSrc->r_con.nsnd << std::endl; - //if(myProc==26 && srcGraph->graphID==18 && ntid == 0) - //std::cout << "Notw its sgID 18,"<< f <<" turn lets see " << cpSrc->r_con.nsnd << std::endl; - //if(srcGraph->graphID==18 && f ==316) - //BL_ASSERT(cpSrc->r_con.nsnd == 177); - if(singleT) - { - pthread_mutex_lock(&(cpSrc->r_con.sndLock)); - for(int i=0; i<cpSrc->r_con.nsnd; i++) - { - Package* sndPackage = cpSrc->r_con.snd[i].recycleQueue.dequeue(true); - mfSrc->m_fabs_v[f]->copyToMem(cpSrc->r_con.snd[i].sbx,srccomp,nc,sndPackage->databuf.local()); - sndPackage->served = false; - sndPackage->completed = false; - cpSrc->r_con.snd[i].pQueue.enqueue(sndPackage,true); - } - cpSrc->r_con.remotePushReady = true; - - pthread_mutex_unlock(&(cpSrc->r_con.sndLock)); - - /* - pthread_mutex_lock(&(srcGraph->sCopyMapHead->map[f]->r_con.sndLock)); - for(int i=0; i<cpSrc->r_con.nsnd; i++) - srcGraph->sCopyMapHead->map[f]->r_con.snd[i].pQueue.enqueue(srcGraph->sCopyMapHead->map[f]->r_con.snd[i].recycleQueue.dequeue(true),true); - pthread_mutex_unlock(&(srcGraph->sCopyMapHead->map[f]->r_con.sndLock)); - */ - } - else - { - if(ntid == 0) - { - pthread_mutex_lock(&(cpSrc->r_con.sndLock)); - //srcGraph->worker[tg]->barr->sync(perilla::NUM_THREADS_PER_TEAM-perilla::NUM_COMM_THREADS); - - //if((i%(perilla::NUM_THREADS_PER_TEAM-perilla::NUM_COMM_THREADS)) == ntid) - for(int i=0; i<cpSrc->r_con.nsnd; i++) - { - Package* sndPackage = cpSrc->r_con.snd[i].recycleQueue.dequeue(true); - mfSrc->m_fabs_v[f]->copyToMem(cpSrc->r_con.snd[i].sbx,srccomp,nc,sndPackage->databuf.local()); - sndPackage->served = false; - sndPackage->completed = false; - cpSrc->r_con.snd[i].pQueue.enqueue(sndPackage,true); - } - - //fout.close(); - //srcGraph->worker[tg]->barr->sync(perilla::NUM_THREADS_PER_TEAM-perilla::NUM_COMM_THREADS); - //if(ntid==0) - //{ - cpSrc->r_con.remotePushReady = true; - /* - pthread_mutex_lock(&(srcGraph->sCopyMapHead->map[f]->r_con.sndLock)); - for(int i=0; i<cpSrc->r_con.nsnd; i++) - srcGraph->sCopyMapHead->map[f]->r_con.snd[i].pQueue.enqueue(srcGraph->sCopyMapHead->map[f]->r_con.snd[i].recycleQueue.dequeue(true),true); - pthread_mutex_unlock(&(srcGraph->sCopyMapHead->map[f]->r_con.sndLock)); - */ - pthread_mutex_unlock(&(cpSrc->r_con.sndLock)); - } - //srcGraph->worker[tg]->barr->sync(perilla::NUM_THREADS_PER_TEAM-perilla::NUM_COMM_THREADS); - } - } // if(!(*mfDst == *mfSrc)) - } // multifabCopyPush - - - - void Perilla::fillBoundaryPull_1Team(RegionGraph* graph, amrex::MultiFab& mf, int f) - { - int myProc = amrex::ParallelDescriptor::MyProc(); - int mfi = mf.IndexArray()[f]; - - int nComp = mf.nComp(); - int tg= perilla::wid(); - int ntid = perilla::wtid();//-perilla::NUM_COMM_THREADS; - - if(ntid==0) - { - pthread_mutex_lock(&(graph->lMap[f]->l_con.dLock)); - //graph->worker[tg]->barr->sync(perilla::NUM_THREADS_PER_TEAM-perilla::NUM_COMM_THREADS); // Barrier to synchronize team threads - - if(perilla::LAZY_PUSH) - { } - else - { - if(perilla::UNPACKING_FINEGRAIN) - {} - else - { - //if( (i%(perilla::NUM_THREADS_PER_TEAM-perilla::NUM_COMM_THREADS)) == ntid) - for(int i=0; i<graph->lMap[f]->l_con.ndcpy; i++) - { - Package *dPackage = graph->lMap[f]->l_con.dcpy[i].pQueue.getFront(true); - /* - for(int d=0; d<dPackage->bufSize; d++) - if(dPackage->databuf[d] == 0) - { - //std::cout<< "in fbPull Reciving 0 for f "<< f << std::endl; - BL_ASSERT(dPackage->databuf[d] != 0); - } - */ - /* - if(f==0) - //if(graph->lMap[f]->l_con.dcpy[i].dbx.smallEnd() == graph->lMap[f]->l_con.dcpy[i].dbx.bigEnd()) - //if(graph->lMap[f]->l_con.dcpy[i].dbx.smallEnd(0)==-1 && graph->lMap[f]->l_con.dcpy[i].dbx.smallEnd(1)==-1 && graph->lMap[f]->l_con.dcpy[i].dbx.smallEnd(2)==4) - std::cout<< "Corner Pull for f "<< f << " data0 " << dPackage->databuf[0] << " size " << dPackage->bufSize <<" se " << graph->lMap[f]->l_con.dcpy[i].dbx.smallEnd() << std::endl; - { - for(int d=0; d<dPackage->bufSize; d++) - std::cout << dPackage->databuf[d] << " "; - std::cout << std::endl; - } - */ - mf.m_fabs_v[f]->copyFromMem(graph->lMap[f]->l_con.dcpy[i].dbx,0,nComp,dPackage->databuf.local()); - } - } // if(UNPACKING_FINEGRAIN) - else - } // if(LAZY_PUSH) - else - - //graph->worker[tg]->barr->sync(perilla::NUM_THREADS_PER_TEAM-perilla::NUM_COMM_THREADS); // Barrier to synchronize team threads - - //if(ntid==0) - //{ - for(int i=0; i<graph->lMap[f]->l_con.ndcpy; i++) - { - graph->lMap[f]->l_con.dcpy[i].recycleQueue.enqueue( graph->lMap[f]->l_con.dcpy[i].pQueue.dequeue(true),true ); - } - - graph->lMap[f]->l_con.firingRuleCnt = graph->lMap[f]->l_con.firingRuleCnt - graph->lMap[f]->l_con.ndcpy; - - - graph->lMap[f]->l_con.scpyCnt = 0; - for(int i=0; i<graph->lMap[f]->l_con.ndcpy; i++) - if(graph->lMap[f]->l_con.dcpy[i].pQueue.queueSize(true) >= 1) - { - graph->lMap[f]->l_con.firingRuleCnt++; - } - - pthread_mutex_unlock(&(graph->lMap[f]->l_con.dLock)); - } - //graph->worker[tg]->barr->sync(perilla::NUM_THREADS_PER_TEAM-perilla::NUM_COMM_THREADS); // Barrier to synchronize team threads - - int np = amrex::ParallelDescriptor::NProcs(); - if (np==1) return; - if(ntid==0) - { - pthread_mutex_lock(&(graph->rMap[f]->r_con.rcvLock)); - pthread_mutex_lock(&(graph->lMap[f]->r_con.rcvLock)); - //} - //graph->worker[tg]->barr->sync(perilla::NUM_THREADS_PER_TEAM-perilla::NUM_COMM_THREADS); // Barrier to synchronize team threads - - //if( (i%(perilla::NUM_THREADS_PER_TEAM-perilla::NUM_COMM_THREADS)) == ntid) - for(int i=0; i<graph->lMap[f]->r_con.nrcv; i++) - { - Package *rcvMetaPackage = graph->rMap[f]->r_con.rcv[i].pQueue.dequeue(true); - rcvMetaPackage->completed = false; - rcvMetaPackage->served = false; - rcvMetaPackage->request = 0; - graph->rMap[f]->r_con.rcv[i].recycleQueue.enqueue(rcvMetaPackage,true); - Package *rcvPackage = graph->lMap[f]->r_con.rcv[i].pQueue.dequeue(true); - - mf.m_fabs_v[f]->copyFromMem(graph->lMap[f]->r_con.rcv[i].dbx,0,nComp,rcvPackage->databuf.local()); - rcvPackage->completed = false; - graph->lMap[f]->r_con.rcv[i].recycleQueue.enqueue(rcvPackage,true); - } - //graph->worker[tg]->barr->sync(perilla::NUM_THREADS_PER_TEAM-perilla::NUM_COMM_THREADS); // Barrier to synchronize team threads - - //if(ntid==0) - //{ - graph->lMap[f]->r_con.firingRuleCnt = graph->lMap[f]->r_con.firingRuleCnt - graph->lMap[f]->r_con.nrcv; - for(int i=0; i<graph->lMap[f]->r_con.nrcv; i++) - if(graph->lMap[f]->r_con.rcv[i].pQueue.queueSize(true) >= 1) - if(graph->lMap[f]->r_con.rcv[i].pQueue.getFront(true)->checkRequest()) - graph->lMap[f]->r_con.firingRuleCnt++; - pthread_mutex_unlock(&(graph->lMap[f]->r_con.rcvLock)); - pthread_mutex_unlock(&(graph->rMap[f]->r_con.rcvLock)); - } - //graph->worker[tg]->barr->sync(perilla::NUM_THREADS_PER_TEAM-perilla::NUM_COMM_THREADS); // Barrier to synchronize team threads - } // fillBoundaryPull - diff --git a/Src/AmrTask/rts_impls/upcxx/PerillaConfig.H b/Src/AmrTask/rts_impls/upcxx/PerillaConfig.H deleted file mode 100755 index 8b2609001e1..00000000000 --- 
a/Src/AmrTask/rts_impls/upcxx/PerillaConfig.H +++ /dev/null @@ -1,22 +0,0 @@ -#ifndef P_PERILLACONFIG_H -#define P_PERILLACONFIG_H - -//class PerillaConfig -namespace perilla -{ - static const int NUM_THREAD_TEAMS=4; - static const int NUM_THREADS_PER_TEAM=4; - static const int NUM_COMM_THREADS=1; - static const int NUM_PREGENERATED_PACKAGES=3; - static const int MSG_QUEUE_DEFAULT_MAXSIZE=3; // same as num of pregenerated packages because these get swapped between pQ and recycleQ - static const int TASK_QUEUE_DEFAULT_SIZE=512; - static const int MAX_SQRT_TAG=512; //sqrt(512*512) - static const bool NUMA_AWARE_MESSAGEHANDLER=true; - static const int LOCK_GRANULARITY=1; //!0 is queue level, 1 is region level - - static const bool LAZY_PUSH=false; - static const bool LAZY_PULL=false; - static const bool PACKING_FINEGRAIN=false; //!PACKING_FINEGRAIN = TRUE is effective when LAZY_PUSH=FALSE - static const bool UNPACKING_FINEGRAIN=false; //!is effective when LAZY_PUSH=FALSE -}; -#endif diff --git a/Src/AmrTask/rts_impls/upcxx/PerillaRts.H b/Src/AmrTask/rts_impls/upcxx/PerillaRts.H deleted file mode 100644 index 23d4676dfdf..00000000000 --- a/Src/AmrTask/rts_impls/upcxx/PerillaRts.H +++ /dev/null @@ -1,45 +0,0 @@ -#include -#include - - -namespace perilla{ - -struct _workerThreadInfo{ - int _tid; //thread id in local group - int _size; //number of threads in the group -}; - -struct _threadInfo{ - bool _isComm; //whether this thread handles communication - int _wtid; //worker thread id (-1 if this thread is dedicated to communication) - int _nWts; //number of thread groups -}; - -class RTS -{ - private: - int _nWrks; - void RTS_Init(); - int _rank, _nProcs; - - public: - RTS(){ - _nWrks=1; - char* nWrks= getenv("NWORKERS"); - if(nWrks) _nWrks= atoi(nWrks); - } - RTS(int nWrks):_nWrks(nWrks){} - int ProcCount(); - int MyProc(); - int WorkerThreadCount(); - int MyWorkerThread(); - void Init(); //Build the runtime system from scratch - void Init(int rank, int nProcs);//Build the runtime system on pre-existing MPI processes - void Iterate(void *graph, int max_step, Real stop_time); - void Finalize(); -// double Time(); - void Barrier(); - void runAMR(Amr* amrptr, int max_step, Real stop_time); -}; - -} diff --git a/Src/AmrTask/rts_impls/upcxx/PerillaRts.cpp b/Src/AmrTask/rts_impls/upcxx/PerillaRts.cpp deleted file mode 100644 index 7dae4f39e11..00000000000 --- a/Src/AmrTask/rts_impls/upcxx/PerillaRts.cpp +++ /dev/null @@ -1,211 +0,0 @@ -//Question? 
email tannguyen@lbl.gov -//Created 07-19-2017 -//Last modification 08-14-2017 -#include -#include -#include -#include -#include -#include -#include "PerillaRts.H" - -#include -#include -using namespace std; -#include - -using namespace perilla; -#ifdef PERILLA_DEBUG -#include -PerillaMemCheck memcheck; -#endif - -namespace perilla{ - Amr* amrptr; - struct RtsDomain{ - pthread_t *_threads; - int _size; - MyLock _lock; - RtsDomain():_threads(NULL), _size(0){}; - ~RtsDomain(){ - free(_threads); - } - }; - int numa_nodes; - RtsDomain *dom; - MyLock _l; - volatile char startSignal=0; - pthread_mutex_t startLock= PTHREAD_MUTEX_INITIALIZER; - - int RTS::ProcCount(){ - return _nProcs; - } - - int RTS::MyProc(){ - return _rank; - } - - int RTS::WorkerThreadCount(){ - return _nWrks; - } - - int RTS::MyWorkerThread(){ - return 0; - } - - struct argT { - int numaID; - int tid; - int g_tid; - int nThreads; - int nTotalThreads; - int max_step; - Real stop_time; - RTS* thisRTS; - }; - - void RTS::runAMR(Amr* amr, int max_step, Real stop_time){ - while (amr->okToContinue() && - (amr->levelSteps(0) < max_step || max_step < 0) && - (amr->cumTime() < stop_time || stop_time < 0.0) ) - - { - // Do a coarse timestep, which calls one or multiple timestep updates (i.e. timeStep()) at each AMR level - amr->coarseTimeStep(stop_time); - } - } - -#ifdef USE_PERILLA_PTHREADS - void run(void* threadInfo){ - argT *args= (argT*)threadInfo; - int numaID= args->numaID; - int tid= args->tid; - int g_tid= args->g_tid; - int nThreads= args->nThreads; - int nTotalThreads= args->nTotalThreads; - int max_step= args->max_step; - Real stop_time= args->stop_time; - RTS* rts= args->thisRTS; - Perilla::registerId(g_tid); - //done with thread id setup, now wait for the start signal from master - pthread_mutex_lock(&startLock); - startSignal++; - pthread_mutex_unlock(&startLock); - while(startSignal!= nTotalThreads){} - rts->runAMR(amrptr, max_step, stop_time); - } -#endif - - void InitializeMPI(){ - int provided; - MPI_Init_thread(0, 0, MPI_THREAD_FUNNELED, &provided); - if(provided == MPI_THREAD_SINGLE){//with this MPI, process can't spawn threads - cerr << "Spawning threads is not allowed by the MPI implementation" << std::endl;; - } - } - - void RTS::RTS_Init(){ - amrptr= NULL; - } - - void RTS::Init(){ - InitializeMPI(); - MPI_Comm_rank(MPI_COMM_WORLD, &_rank); - MPI_Comm_size(MPI_COMM_WORLD, &_nProcs); - RTS_Init(); - } - - void RTS::Init(int rank, int nProcs){ - _rank= rank; - _nProcs= nProcs; - RTS_Init(); - } - - void RTS::Finalize(){ -#ifdef PERILLA_DEBUG - memcheck.report(); -#endif - } - - void RTS::Iterate(void* amrGraph, int max_step, Real stop_time){ - assert(amrGraph); - Perilla::max_step= max_step; - amrptr= (Amr*)amrGraph; - WorkerThread::init(); -#ifndef USE_PERILLA_PTHREADS - runAMR(amrptr, max_step, stop_time); -#else - int numa_nodes= perilla::NUM_THREAD_TEAMS; - int worker_per_numa = perilla::NUM_THREADS_PER_TEAM; - int _nWrks= numa_nodes*worker_per_numa; - int base=0; - int localID=-1; - //create a list of persistent threads for each NUMA node - cpu_set_t cpuset; - pthread_attr_t attr; - pthread_attr_init(&attr); - dom= new RtsDomain[numa_nodes]; - for(int i=0; inumaID= domNo; - arg->tid= localID; - arg->g_tid= domNo*worker_per_numa+localID; - arg->nThreads= worker_per_numa; - arg->nTotalThreads= _nWrks; - arg->thisRTS= this; - arg->max_step= max_step; - arg->stop_time= stop_time; - int err = pthread_create(&(dom[domNo]._threads[localID]), &attr, (void*(*)(void*))run, arg); - }else{ //master thread - 
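/* The spawn loop above creates one persistent pthread per worker on each
   NUMA domain; the matching handshake is the startSignal counter: each
   thread (including the master, below) increments it under startLock and
   then spin-waits until all nTotalThreads have checked in before entering
   runAMR, so no worker begins stepping the AMR hierarchy early. The shape
   of the pattern, as used in run() above (sketch):

       pthread_mutex_lock(&startLock);
       startSignal++;
       pthread_mutex_unlock(&startLock);
       while (startSignal != nTotalThreads) {}   // busy-wait barrier
       rts->runAMR(amrptr, max_step, stop_time);
*/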
dom[domNo]._threads[localID]= pthread_self(); - Perilla::registerId(0); - //enable worker threads to start computing - pthread_mutex_lock(&startLock); - startSignal++; - pthread_mutex_unlock(&startLock); - } - dom[domNo]._size++; - if(localID == (worker_per_numa-1)){ - localID=-1; - base+= worker_per_numa; - } - } - while(startSignal!= _nWrks){}//wait until all threads have done the setup phase - runAMR(amrptr, max_step, stop_time); - for(int i=1; i<_nWrks; i++) pthread_join(dom[i/worker_per_numa]._threads[i%worker_per_numa], NULL); -#endif - } - -#if 0 - const double kMicro = 1.0e-6; - double RTS::Time() - { - struct timeval TV; - - const int RC = gettimeofday(&TV, NULL); - if(RC == -1) - { - printf("ERROR: Bad call to gettimeofday\n"); - return(-1); - } - return( ((double)TV.tv_sec) + kMicro * ((double)TV.tv_usec) ); - } -#endif - - void RTS::Barrier(){ - upcxx::barrier(); - } - -}//end namespace - diff --git a/Src/AmrTask/rts_impls/upcxx/perilla.mak b/Src/AmrTask/rts_impls/upcxx/perilla.mak deleted file mode 100755 index 757d77878da..00000000000 --- a/Src/AmrTask/rts_impls/upcxx/perilla.mak +++ /dev/null @@ -1,20 +0,0 @@ -CEXE_sources += Barrier.cpp -CEXE_sources += PackageQueue.cpp -CEXE_sources += Perilla.cpp -CEXE_sources += RGIter.cpp -CEXE_sources += RegionGraph.cpp -CEXE_sources += WorkerThread.cpp -CEXE_sources += AsyncMultiFabUtil.cpp - - -CEXE_headers += Barrier.H -CEXE_headers += Config.H -CEXE_headers += LocalConnection.H -CEXE_headers += PackageQueue.H -CEXE_headers += RegionGraph.H -CEXE_headers += RemoteConnection.H -CEXE_headers += WorkerThread.H -CEXE_headers += AsyncMultiFabUtil.H - - - diff --git a/Src/AmrTask/todolist b/Src/AmrTask/todolist deleted file mode 100644 index 3e52aba3d1b..00000000000 --- a/Src/AmrTask/todolist +++ /dev/null @@ -1 +0,0 @@ --Make the graph instantiation NUMA aware (important when there are tasks that allocate data) diff --git a/Src/Base/AMReX.H b/Src/Base/AMReX.H index 8e2b33fb4fa..f56250ab4fc 100644 --- a/Src/Base/AMReX.H +++ b/Src/Base/AMReX.H @@ -7,7 +7,9 @@ #include #include #include +#include #include +#include #include #include @@ -88,41 +90,77 @@ namespace amrex void ExecOnFinalize (PTR_TO_VOID_FUNC); void ExecOnInitialize (PTR_TO_VOID_FUNC); + //! This shuts up the compiler about unused variables + template + AMREX_GPU_HOST_DEVICE AMREX_FORCE_INLINE + void ignore_unused (const Ts&...) {} + //! Print out message to cerr and exit via amrex::Abort(). void Error (const std::string& msg); - namespace detail { void Error_host_doit (const char * msg); } - AMREX_GPU_HOST_DEVICE inline - void Error (const char * msg = 0) { + + void Error_host (const char* msg); + +#if defined(AMREX_USE_GPU) && !defined(NDEBUG) + AMREX_GPU_EXTERNAL AMREX_GPU_DEVICE AMREX_NO_INLINE + void Error_device (const char * msg); +#endif + + AMREX_GPU_HOST_DEVICE AMREX_FORCE_INLINE + void Error (const char* msg = 0) { #if AMREX_DEVICE_COMPILE - if (msg) AMREX_DEVICE_PRINTF("Error %s\n", msg); - AMREX_DEVICE_ASSERT(0); +#ifdef NDEBUG + amrex::ignore_unused(msg); +#else + Error_device(msg); +#endif #else - detail::Error_host_doit(msg); + Error_host(msg); #endif } //! Print out warning message to cerr. 
void Warning (const std::string& msg); - namespace detail { void Warning_host_doit (const char * msg); } - AMREX_GPU_HOST_DEVICE inline + + void Warning_host (const char * msg); + +#if defined(AMREX_USE_GPU) && !defined(NDEBUG) + AMREX_GPU_EXTERNAL AMREX_GPU_DEVICE AMREX_NO_INLINE + void Warning_device (const char * msg); +#endif + + AMREX_GPU_HOST_DEVICE AMREX_FORCE_INLINE void Warning (const char * msg) { #if AMREX_DEVICE_COMPILE - if (msg) AMREX_DEVICE_PRINTF("Warning %s\n", msg); +#ifdef NDEBUG + amrex::ignore_unused(msg); #else - detail::Warning_host_doit(msg); + Warning_device(msg); +#endif +#else + Warning_host(msg); #endif } //! Print out message to cerr and exit via abort(). void Abort (const std::string& msg); - namespace detail { void Abort_host_doit (const char * msg); } - AMREX_GPU_HOST_DEVICE inline + + void Abort_host (const char * msg); + +#if defined(AMREX_USE_GPU) && !defined(NDEBUG) + AMREX_GPU_EXTERNAL AMREX_GPU_DEVICE AMREX_NO_INLINE + void Abort_device (const char * msg); +#endif + + AMREX_GPU_HOST_DEVICE AMREX_FORCE_INLINE void Abort (const char * msg = 0) { #if AMREX_DEVICE_COMPILE - if (msg) AMREX_DEVICE_PRINTF("Abort %s\n", msg); - AMREX_DEVICE_ASSERT(0); +#ifdef NDEBUG + amrex::ignore_unused(msg); #else - detail::Abort_host_doit(msg); + Abort_device(msg); +#endif +#else + Abort_host(msg); #endif } @@ -131,32 +169,27 @@ namespace amrex * via abort(). Intended for use by the BL_ASSERT() macro * in . */ - namespace detail { void Assert_host_doit (const char* EX, const char* file, int line, - const char* msg); } - AMREX_GPU_HOST_DEVICE inline + + void Assert_host (const char* EX, const char* file, int line, const char* msg); + +#if defined(AMREX_USE_GPU) && !defined(NDEBUG) + AMREX_GPU_EXTERNAL AMREX_GPU_DEVICE AMREX_NO_INLINE + void Assert_device (const char* EX, const char* file, int line, const char* msg); +#endif + + AMREX_GPU_HOST_DEVICE AMREX_FORCE_INLINE void Assert (const char* EX, const char* file, int line, const char* msg = nullptr) { #if AMREX_DEVICE_COMPILE - if (msg) { - AMREX_DEVICE_PRINTF("Assertion `%s' failed, file \"%s\", line %d, Msg: %s", - EX, file, line, msg); - } else { - AMREX_DEVICE_PRINTF("Assertion `%s' failed, file \"%s\", line %d", - EX, file, line); - } - AMREX_DEVICE_ASSERT(0); +#ifdef NDEBUG + amrex::ignore_unused(EX,file,line,msg); +#else + Assert_device(EX,file,line,msg); +#endif #else - detail::Assert_host_doit(EX, file, line, msg); + Assert_host(EX,file,line,msg); #endif } - /** - * \brief Prints out an out-of-memory message and aborts. It is - * called by various routines when a call to new fails. 
- * - * Called as amrex::OutOfMemory(__FILE__, __LINE__); - */ - void OutOfMemory (const char* file, int line); - /** * \brief This is used by amrex::Error(), amrex::Abort(), and amrex::Assert() * to ensure that when writing the message to stderr, that no additional diff --git a/Src/Base/AMReX.cpp b/Src/Base/AMReX.cpp index a727099aad0..9b2f9b47e99 100644 --- a/Src/Base/AMReX.cpp +++ b/Src/Base/AMReX.cpp @@ -1,15 +1,4 @@ -#include -#include -#include -#include -#include -#include -#include -#include -#include -#include -#include - +#include #include #include #include @@ -20,7 +9,9 @@ #include #include #include - +#include +#include +#include #include #ifdef AMREX_USE_CUPTI @@ -53,10 +44,22 @@ #include #endif -#include -#include +#if defined(__APPLE__) +#include +#endif -#include +#include +#include +#include +#include +#include +#include +#include +#include +#include +#include +#include +#include namespace amrex { @@ -145,7 +148,7 @@ amrex::write_to_stderr_without_buffering (const char* str) } } -static +namespace { void write_lib_id(const char* msg) { @@ -158,9 +161,28 @@ write_lib_id(const char* msg) fwrite("::", 2, 1, stderr); } } +} void -amrex::detail::Error_host_doit (const char* msg) +amrex::Error (const std::string& msg) +{ + Error(msg.c_str()); +} + +void +amrex::Abort (const std::string& msg) +{ + Abort(msg.c_str()); +} + +void +amrex::Warning (const std::string& msg) +{ + Warning(msg.c_str()); +} + +void +amrex::Error_host (const char * msg) { if (system::error_handler) { system::error_handler(msg); @@ -169,18 +191,46 @@ amrex::detail::Error_host_doit (const char* msg) } else { write_lib_id("Error"); write_to_stderr_without_buffering(msg); +#ifdef _OPENMP +#pragma omp critical (amrex_abort_omp_critical) +#endif ParallelDescriptor::Abort(); } } +#if defined(AMREX_USE_GPU) && !defined(NDEBUG) +#if AMREX_DEVICE_COMPILE +AMREX_GPU_DEVICE void -amrex::Error (const std::string& msg) +amrex::Error_device (const char * msg) { - Error(msg.c_str()); + if (msg) AMREX_DEVICE_PRINTF("Error %s\n", msg); + AMREX_DEVICE_ASSERT(0); +} +#endif +#endif + +void +amrex::Warning_host (const char * msg) +{ + if (msg) { + amrex::Print(Print::AllProcs,amrex::ErrorStream()) << msg << '!' << '\n'; + } +} + +#if defined(AMREX_USE_GPU) && !defined(NDEBUG) +#if AMREX_DEVICE_COMPILE +AMREX_GPU_DEVICE +void +amrex::Warning_device (const char * msg) +{ + if (msg) AMREX_DEVICE_PRINTF("Warning %s\n", msg); } +#endif +#endif void -amrex::detail::Abort_host_doit (const char* msg) +amrex::Abort_host (const char * msg) { if (system::error_handler) { system::error_handler(msg); @@ -196,29 +246,20 @@ amrex::detail::Abort_host_doit (const char* msg) } } +#if defined(AMREX_USE_GPU) && !defined(NDEBUG) +#if AMREX_DEVICE_COMPILE +AMREX_GPU_DEVICE void -amrex::Abort (const std::string& msg) +amrex::Abort_device (const char * msg) { - Abort(msg.c_str()); -} - -void -amrex::detail::Warning_host_doit (const char* msg) -{ - if (msg) - { - amrex::Print(Print::AllProcs,amrex::ErrorStream()) << msg << '!' 
<< '\n'; - } -} - -void -amrex::Warning (const std::string& msg) -{ - Warning(msg.c_str()); + if (msg) AMREX_DEVICE_PRINTF("Abort %s\n", msg); + AMREX_DEVICE_ASSERT(0); } +#endif +#endif void -amrex::detail::Assert_host_doit (const char* EX, const char* file, int line, const char* msg) +amrex::Assert_host (const char* EX, const char* file, int line, const char* msg) { const int N = 512; @@ -247,10 +288,31 @@ amrex::detail::Assert_host_doit (const char* EX, const char* file, int line, con throw RuntimeError(buf); } else { write_to_stderr_without_buffering(buf); +#ifdef _OPENMP +#pragma omp critical (amrex_abort_omp_critical) +#endif ParallelDescriptor::Abort(); } } +#if defined(AMREX_USE_GPU) && !defined(NDEBUG) +#if AMREX_DEVICE_COMPILE +AMREX_GPU_DEVICE +void +amrex::Assert_device (const char* EX, const char* file, int line, const char* msg) +{ + if (msg) { + AMREX_DEVICE_PRINTF("Assertion `%s' failed, file \"%s\", line %d, Msg: %s", + EX, file, line, msg); + } else { + AMREX_DEVICE_PRINTF("Assertion `%s' failed, file \"%s\", line %d", + EX, file, line); + } + AMREX_DEVICE_ASSERT(0); +} +#endif +#endif + namespace { std::stack<PTR_TO_VOID_FUNC> The_Finalize_Function_Stack; @@ -315,13 +377,7 @@ amrex::Initialize (int& argc, char**& argv, bool build_parm_parse, if (argc > 0) { if (argv[0][0] != '/') { - constexpr int bufSize = 1024; - char temp[bufSize]; - char *rCheck = getcwd(temp, bufSize); - if(rCheck == 0) { - amrex::Abort("**** Error: getcwd buffer too small."); - } - system::exename = temp; + system::exename = FileSystem::CurrentPath(); system::exename += "/"; } system::exename += argv[0]; @@ -333,7 +389,7 @@ } } -#if defined(PERILLA_USE_UPCXX) || defined(AMREX_USE_UPCXX) +#if defined(AMREX_USE_UPCXX) upcxx::init(); #endif @@ -433,7 +489,8 @@ if (invalid) curr_fpe_excepts |= FE_INVALID; if (divbyzero) curr_fpe_excepts |= FE_DIVBYZERO; if (overflow) curr_fpe_excepts |= FE_OVERFLOW; -#if !defined(__PGI) || (__PGIC__ >= 16) +#if !defined(AMREX_USE_DPCPP) && (!defined(__PGI) || (__PGIC__ >= 16)) + // xxxxx DPCPP todo: fpe trap prev_fpe_excepts = fegetexcept(); if (curr_fpe_excepts != 0) { feenableexcept(curr_fpe_excepts); // trap floating point exceptions @@ -482,6 +539,9 @@ BL_PROFILE_INITPARAMS(); #endif machine::Initialize(); +#ifdef AMREX_USE_GPU + Gpu::Fuser::Initialize(); +#endif if (system::verbose > 0) { @@ -611,7 +671,7 @@ amrex::Finalize (amrex::AMReX* pamrex) Gpu::Device::Finalize(); #endif -#if defined(PERILLA_USE_UPCXX) || defined(AMREX_USE_UPCXX) +#if defined(AMREX_USE_UPCXX) upcxx::finalize(); #endif diff --git a/Src/Base/AMReX_Algorithm.H b/Src/Base/AMReX_Algorithm.H index a9aa54d6038..06d3055a9ed 100644 --- a/Src/Base/AMReX_Algorithm.H +++ b/Src/Base/AMReX_Algorithm.H @@ -6,6 +6,7 @@ #include #include #include +#include namespace amrex { @@ -55,6 +56,50 @@ namespace amrex t1 = std::move(t2); t2 = std::move(temp); } + + template <typename T> + AMREX_GPU_HOST_DEVICE AMREX_FORCE_INLINE + constexpr const T& Clamp (const T& v, const T& lo, const T& hi) + { + return (v < lo) ? lo : (hi < v) ? hi : v; + } + + template <typename T, typename F> + AMREX_GPU_HOST_DEVICE AMREX_FORCE_INLINE + T bisect (T lo, T hi, F f, T tol=1e-12, int max_iter=100) + { + AMREX_ASSERT_WITH_MESSAGE(hi > lo, + "Error - calling bisect but lo and hi don't describe a reasonable interval."); + + T flo = f(lo); + T fhi = f(hi); + + if (flo == T(0)) return lo; + if (fhi == T(0)) return hi; + + AMREX_ASSERT_WITH_MESSAGE(flo * fhi <= T(0), + "Error - calling bisect but lo and hi don't bracket a root."); + + T mi = (lo + hi) / T(2); + T fmi = 0.0; + int n = 1; + while (n <= max_iter) + { + if (hi - lo < tol) break; + mi = (lo + hi) / T(2); + fmi = f(mi); + if (fmi == T(0)) break; + fmi*flo < T(0) ? hi = mi : lo = mi; + flo = f(lo); + fhi = f(hi); + ++n; + } + + AMREX_ASSERT_WITH_MESSAGE(n < max_iter, + "Error - maximum number of iterations reached in bisect."); + + return mi; + } } #endif diff --git a/Src/Base/AMReX_Arena.H b/Src/Base/AMReX_Arena.H index 7cfa8d4c209..cc230e41a86 100644 --- a/Src/Base/AMReX_Arena.H +++ b/Src/Base/AMReX_Arena.H @@ -89,8 +89,6 @@ public: static void PrintUsage (); static void Finalize (); -protected: - #if 0 union Word { @@ -104,6 +102,8 @@ protected: static const std::size_t align_size = 16; +protected: + ArenaInfo arena_info; void* allocate_system (std::size_t nbytes); diff --git a/Src/Base/AMReX_Arena.cpp b/Src/Base/AMReX_Arena.cpp index 51344845933..044cb86fc7b 100644 --- a/Src/Base/AMReX_Arena.cpp +++ b/Src/Base/AMReX_Arena.cpp @@ -11,7 +11,17 @@ #include #include +#ifdef _WIN32 +///#include +//#define AMREX_MLOCK(x,y) VirtualLock(x,y) +//#define AMREX_MUNLOCK(x,y) VirtualUnlock(x,y) +#define AMREX_MLOCK(x,y) ((void)0) +#define AMREX_MUNLOCK(x,y) ((void)0) +#else #include +#define AMREX_MLOCK(x,y) mlock(x,y) +#define AMREX_MUNLOCK(x,y) munlock(x,y) +#endif namespace amrex { @@ -27,6 +37,11 @@ namespace { bool use_buddy_allocator = false; Long buddy_allocator_size = 0L; Long the_arena_init_size = 0L; +#ifdef AMREX_USE_HIP + bool the_arena_is_managed = false; // xxxxx HIP FIX HERE +#else + bool the_arena_is_managed = true; +#endif bool abort_on_out_of_gpu_memory = false; } @@ -54,7 +69,7 @@ Arena::allocate_system (std::size_t nbytes) if (arena_info.use_cpu_memory) { p = std::malloc(nbytes); - if (p && arena_info.device_use_hostalloc) mlock(p, nbytes); + if (p && arena_info.device_use_hostalloc) AMREX_MLOCK(p, nbytes); } else if (arena_info.device_use_hostalloc) { @@ -76,9 +91,9 @@ if (arena_info.device_use_managed_memory) { AMREX_HIP_OR_CUDA_OR_DPCPP - (AMREX_HIP_SAFE_CALL(hipMalloc(&p, nbytes));, + (AMREX_HIP_SAFE_CALL(hipMallocManaged(&p, nbytes));, AMREX_CUDA_SAFE_CALL(cudaMallocManaged(&p, nbytes));, - p = sycl::malloc_shared(nbytes, Gpu::Device::syclDevice(), Gpu::Device::syclContext());); + p = sycl::malloc_shared(nbytes, Gpu::Device::syclDevice(), Gpu::Device::syclContext())); if (arena_info.device_set_readonly) { Gpu::Device::mem_advise_set_readonly(p, nbytes); @@ -94,12 +109,12 @@ AMREX_HIP_OR_CUDA_OR_DPCPP (AMREX_HIP_SAFE_CALL ( hipMalloc(&p, nbytes));, AMREX_CUDA_SAFE_CALL(cudaMalloc(&p, nbytes));, - p = sycl::malloc_device(nbytes, Gpu::Device::syclDevice(), Gpu::Device::syclContext());); + p = sycl::malloc_device(nbytes, Gpu::Device::syclDevice(), Gpu::Device::syclContext())); } } #else p = std::malloc(nbytes); - if (p && arena_info.device_use_hostalloc) mlock(p, nbytes); + if (p && arena_info.device_use_hostalloc) AMREX_MLOCK(p, nbytes); #endif if (p == nullptr) amrex::Abort("Sorry, malloc failed"); 
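/* A minimal usage sketch for the Clamp and bisect utilities added to
   AMReX_Algorithm.H above (illustrative only; assumes amrex::Real is double
   and uses the default tol and max_iter):

       int ic = amrex::Clamp(i, 0, n-1);              // clamp an index into [0, n-1]

       amrex::Real root = amrex::bisect(0.0, 2.0,
           [] (amrex::Real x) { return x*x - 1.0; }); // converges to ~1.0

   bisect requires f(lo) and f(hi) to bracket a root (flo*fhi <= 0), which
   the assertions above enforce in debug builds. */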
return p; @@ -111,7 +126,7 @@ Arena::deallocate_system (void* p, std::size_t nbytes) #ifdef AMREX_USE_GPU if (arena_info.use_cpu_memory) { - if (p && arena_info.device_use_hostalloc) munlock(p, nbytes); + if (p && arena_info.device_use_hostalloc) AMREX_MUNLOCK(p, nbytes); std::free(p); } else if (arena_info.device_use_hostalloc) @@ -126,10 +141,10 @@ Arena::deallocate_system (void* p, std::size_t nbytes) AMREX_HIP_OR_CUDA_OR_DPCPP (AMREX_HIP_SAFE_CALL ( hipFree(p));, AMREX_CUDA_SAFE_CALL(cudaFree(p));, - sycl::free(p,Gpu::Device::syclContext());); + sycl::free(p,Gpu::Device::syclContext())); } #else - if (p && arena_info.device_use_hostalloc) munlock(p, nbytes); + if (p && arena_info.device_use_hostalloc) AMREX_MUNLOCK(p, nbytes); std::free(p); #endif } @@ -150,6 +165,7 @@ Arena::Initialize () pp.query("use_buddy_allocator", use_buddy_allocator); pp.query("buddy_allocator_size", buddy_allocator_size); pp.query("the_arena_init_size", the_arena_init_size); + pp.query("the_arena_is_managed", the_arena_is_managed); pp.query("abort_on_out_of_gpu_memory", abort_on_out_of_gpu_memory); #ifdef AMREX_USE_GPU @@ -165,13 +181,21 @@ Arena::Initialize () } std::size_t chunk = 512*1024*1024; buddy_allocator_size = (buddy_allocator_size/chunk) * chunk; - the_arena = new DArena(buddy_allocator_size, 512, ArenaInfo().SetPreferred()); + if (the_arena_is_managed) { + the_arena = new DArena(buddy_allocator_size, 512, ArenaInfo().SetPreferred()); + } else { + the_arena = new DArena(buddy_allocator_size, 512, ArenaInfo().SetDeviceMemory()); + } } else #endif { #if defined(BL_COALESCE_FABS) || defined(AMREX_USE_GPU) - the_arena = new CArena(0, ArenaInfo().SetPreferred()); + if (the_arena_is_managed) { + the_arena = new CArena(0, ArenaInfo().SetPreferred()); + } else { + the_arena = new CArena(0, ArenaInfo().SetDeviceMemory()); + } #ifdef AMREX_USE_GPU if (the_arena_init_size <= 0) { #ifdef AMREX_USE_DPCPP diff --git a/Src/Base/AMReX_Array.H b/Src/Base/AMReX_Array.H index 6b2154542f1..f53ad13429c 100644 --- a/Src/Base/AMReX_Array.H +++ b/Src/Base/AMReX_Array.H @@ -39,25 +39,29 @@ namespace amrex { T& operator [] (int i) noexcept { return arr[i]; } AMREX_GPU_HOST_DEVICE AMREX_FORCE_INLINE - const T* data () const noexcept { return arr; }; + const T* data () const noexcept { return arr; } AMREX_GPU_HOST_DEVICE AMREX_FORCE_INLINE - T* data () noexcept { return arr; }; + T* data () noexcept { return arr; } AMREX_GPU_HOST_DEVICE AMREX_FORCE_INLINE - std::size_t size() const noexcept { return N; }; + std::size_t size() const noexcept { return N; } AMREX_GPU_HOST_DEVICE AMREX_FORCE_INLINE - const T* begin() const noexcept { return arr; }; + const T* begin() const noexcept { return arr; } AMREX_GPU_HOST_DEVICE AMREX_FORCE_INLINE - const T* end() const noexcept { return arr + N; }; + const T* end() const noexcept { return arr + N; } AMREX_GPU_HOST_DEVICE AMREX_FORCE_INLINE - T* begin() noexcept { return arr; }; + T* begin() noexcept { return arr; } AMREX_GPU_HOST_DEVICE AMREX_FORCE_INLINE - T* end() noexcept { return arr + N; }; + T* end() noexcept { return arr + N; } + + AMREX_GPU_HOST_DEVICE AMREX_FORCE_INLINE + void fill( const T& value ) noexcept + { for (std::size_t i = 0; i < N; ++i) arr[i] = value; } T arr[amrex::max(N,std::size_t{1})]; }; @@ -75,11 +79,13 @@ namespace amrex { { AMREX_GPU_HOST_DEVICE AMREX_FORCE_INLINE const T& operator() (int i) const noexcept { + AMREX_ASSERT(i >= XLO && i <= XHI); return arr[i-XLO]; } AMREX_GPU_HOST_DEVICE AMREX_FORCE_INLINE T& operator() (int i) noexcept { + AMREX_ASSERT(i >= 
XLO && i <= XHI); return arr[i-XLO]; } @@ -94,6 +100,7 @@ namespace amrex { typename std::enable_if::value,int>::type=0> AMREX_GPU_HOST_DEVICE AMREX_FORCE_INLINE const T& operator() (int i, int j) const noexcept { + AMREX_ASSERT(i >= XLO && i <= XHI && j >= YLO && j <= YHI); return arr[i+j*(XHI-XLO+1)-(YLO*(XHI-XLO+1)+XLO)]; } @@ -101,6 +108,7 @@ namespace amrex { typename std::enable_if::value,int>::type=0> AMREX_GPU_HOST_DEVICE AMREX_FORCE_INLINE T& operator() (int i, int j) noexcept { + AMREX_ASSERT(i >= XLO && i <= XHI && j >= YLO && j <= YHI); return arr[i+j*(XHI-XLO+1)-(YLO*(XHI-XLO+1)+XLO)]; } @@ -108,6 +116,7 @@ namespace amrex { typename std::enable_if::value,int>::type=0> AMREX_GPU_HOST_DEVICE AMREX_FORCE_INLINE const T& operator() (int i, int j) const noexcept { + AMREX_ASSERT(i >= XLO && i <= XHI && j >= YLO && j <= YHI); return arr[j+i*(YHI-YLO+1)-(XLO*(YHI-YLO+1)+YLO)]; } @@ -115,6 +124,7 @@ namespace amrex { typename std::enable_if::value,int>::type=0> AMREX_GPU_HOST_DEVICE AMREX_FORCE_INLINE T& operator() (int i, int j) noexcept { + AMREX_ASSERT(i >= XLO && i <= XHI && j >= YLO && j <= YHI); return arr[j+i*(YHI-YLO+1)-(XLO*(YHI-YLO+1)+YLO)]; } @@ -166,31 +176,31 @@ namespace amrex template std::array GetArrOfPtrs (std::array& a) noexcept { - return {AMREX_D_DECL(&a[0], &a[1], &a[2])}; + return {{AMREX_D_DECL(&a[0], &a[1], &a[2])}}; } template std::array GetArrOfPtrs (const std::array,AMREX_SPACEDIM>& a) noexcept { - return {AMREX_D_DECL(a[0].get(), a[1].get(), a[2].get())}; + return {{AMREX_D_DECL(a[0].get(), a[1].get(), a[2].get())}}; } - + template std::array GetArrOfConstPtrs (const std::array& a) noexcept { - return {AMREX_D_DECL(&a[0], &a[1], &a[2])}; + return {{AMREX_D_DECL(&a[0], &a[1], &a[2])}}; } template std::array GetArrOfConstPtrs (const std::array& a) noexcept { - return {AMREX_D_DECL(a[0], a[1], a[2])}; + return {{AMREX_D_DECL(a[0], a[1], a[2])}}; } template std::array GetArrOfConstPtrs (const std::array,AMREX_SPACEDIM>& a) noexcept { - return {AMREX_D_DECL(a[0].get(), a[1].get(), a[2].get())}; + return {{AMREX_D_DECL(a[0].get(), a[1].get(), a[2].get())}}; } } @@ -210,4 +220,3 @@ namespace amrex } #endif - diff --git a/Src/Base/AMReX_Array4.H b/Src/Base/AMReX_Array4.H index a23fd8ed1ff..3fd9ad9c62a 100644 --- a/Src/Base/AMReX_Array4.H +++ b/Src/Base/AMReX_Array4.H @@ -10,17 +10,17 @@ namespace amrex { struct Array4 { T* AMREX_RESTRICT p; - Long jstride; - Long kstride; - Long nstride; - Dim3 begin; - Dim3 end; // end is hi + 1 - int ncomp; + Long jstride = 0; + Long kstride = 0; + Long nstride = 0; + Dim3 begin{1,1,1}; + Dim3 end{0,0,0}; // end is hi + 1 + int ncomp=0; AMREX_GPU_HOST_DEVICE constexpr Array4 () noexcept : p(nullptr) {} - template ::value>::type > + template ::value,int>::type = 0> AMREX_GPU_HOST_DEVICE constexpr Array4 (Array4::type> const& rhs) noexcept : p(rhs.p), @@ -44,9 +44,9 @@ namespace amrex { {} template ::type, - typename std::remove_const::type>::value>::type > + typename std::remove_const::type>::value,int>::type = 0> AMREX_GPU_HOST_DEVICE constexpr Array4 (Array4 const& rhs, int start_comp) noexcept : p((T*)(rhs.p+start_comp*rhs.nstride)), @@ -61,7 +61,7 @@ namespace amrex { AMREX_GPU_HOST_DEVICE explicit operator bool() const noexcept { return p != nullptr; } - template ::value>::type > + template ::value,int>::type = 0> AMREX_GPU_HOST_DEVICE AMREX_FORCE_INLINE U& operator() (int i, int j, int k) const noexcept { #if defined(AMREX_DEBUG) || defined(AMREX_BOUND_CHECK) @@ -70,7 +70,7 @@ namespace amrex { return 
p[(i-begin.x)+(j-begin.y)*jstride+(k-begin.z)*kstride]; } - template ::value>::type > + template ::value,int>::type = 0> AMREX_GPU_HOST_DEVICE AMREX_FORCE_INLINE U& operator() (int i, int j, int k, int n) const noexcept { #if defined(AMREX_DEBUG) || defined(AMREX_BOUND_CHECK) @@ -79,7 +79,7 @@ namespace amrex { return p[(i-begin.x)+(j-begin.y)*jstride+(k-begin.z)*kstride+n*nstride]; } - template ::value>::type > + template ::value,int>::type = 0> AMREX_GPU_HOST_DEVICE AMREX_FORCE_INLINE T* ptr (int i, int j, int k) const noexcept { #if defined(AMREX_DEBUG) || defined(AMREX_BOUND_CHECK) @@ -88,7 +88,7 @@ namespace amrex { return p + ((i-begin.x)+(j-begin.y)*jstride+(k-begin.z)*kstride); } - template ::value>::type > + template ::value,int>::type = 0> AMREX_GPU_HOST_DEVICE AMREX_FORCE_INLINE T* ptr (int i, int j, int k, int n) const noexcept { #if defined(AMREX_DEBUG) || defined(AMREX_BOUND_CHECK) @@ -97,7 +97,7 @@ namespace amrex { return p + ((i-begin.x)+(j-begin.y)*jstride+(k-begin.z)*kstride+n*nstride); } - template ::value>::type > + template ::value,int>::type = 0> AMREX_GPU_HOST_DEVICE AMREX_FORCE_INLINE U& operator() (IntVect const& iv) const noexcept { #if (AMREX_SPACEDIM == 1) @@ -109,7 +109,7 @@ namespace amrex { #endif } - template ::value>::type > + template ::value,int>::type = 0> AMREX_GPU_HOST_DEVICE AMREX_FORCE_INLINE U& operator() (IntVect const& iv, int n) const noexcept { #if (AMREX_SPACEDIM == 1) @@ -121,7 +121,7 @@ namespace amrex { #endif } - template ::value>::type > + template ::value,int>::type = 0> AMREX_GPU_HOST_DEVICE AMREX_FORCE_INLINE T* ptr (IntVect const& iv) const noexcept { #if (AMREX_SPACEDIM == 1) @@ -133,7 +133,7 @@ namespace amrex { #endif } - template ::value>::type > + template ::value,int>::type = 0> AMREX_GPU_HOST_DEVICE AMREX_FORCE_INLINE T* ptr (IntVect const& iv, int n) const noexcept { #if (AMREX_SPACEDIM == 1) diff --git a/Src/Base/AMReX_AsyncOut.H b/Src/Base/AMReX_AsyncOut.H index ed02e2f799e..523d6027df7 100644 --- a/Src/Base/AMReX_AsyncOut.H +++ b/Src/Base/AMReX_AsyncOut.H @@ -1,7 +1,6 @@ #ifndef AMREX_ASYNCOUT_H_ #define AMREX_ASYNCOUT_H_ -#include #include namespace amrex { diff --git a/Src/Base/AMReX_AsyncOut.cpp b/Src/Base/AMReX_AsyncOut.cpp index 66aa3594680..4d42552f9ad 100644 --- a/Src/Base/AMReX_AsyncOut.cpp +++ b/Src/Base/AMReX_AsyncOut.cpp @@ -1,49 +1,36 @@ #include +#include +#include #include #include +#include #include -#include -#include -#include -#include -#include -#include namespace amrex { namespace AsyncOut { namespace { +#if defined(AMREX_USE_DPCPP) || defined(AMREX_USE_HIP) +int s_asyncout = true; // Have this on by default for DPC++ for now so that + // I/O writing plotfile does not depend on unified + // memory. 
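/* AsyncOut offloads plotfile writing to a background thread. A typical
   inputs-file configuration (sketch; these are the ParmParse keys queried
   in Initialize() below):

       amrex.async_out = 1          # enable asynchronous output
       amrex.async_out_nfiles = 64  # cap on the number of output files

   When async_out_nfiles is smaller than the number of MPI ranks, the MPI
   library must provide MPI_THREAD_MULTIPLE at runtime; Initialize() below
   aborts with a message otherwise. */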
+#else int s_asyncout = false; +#endif int s_noutfiles = 64; MPI_Comm s_comm = MPI_COMM_NULL; -std::unique_ptr s_thread; -std::mutex s_mutx; -std::condition_variable s_cond; -static std::queue > s_func; -static bool s_finalizing = false; +std::unique_ptr s_thread; WriteInfo s_info; -void do_job () -{ - while (true) - { - std::unique_lock lck(s_mutx); - s_cond.wait(lck, [] () -> bool { return not s_func.empty(); }); - auto f = s_func.front(); - s_func.pop(); - lck.unlock(); - f(); - if (s_finalizing) break; - } -} - } void Initialize () { + amrex::ignore_unused(s_comm,s_info); + ParmParse pp("amrex"); pp.query("async_out", s_asyncout); pp.query("async_out_nfiles", s_noutfiles); @@ -51,19 +38,24 @@ void Initialize () int nprocs = ParallelDescriptor::NProcs(); s_noutfiles = std::min(s_noutfiles, nprocs); +#ifdef AMREX_USE_MPI if (s_asyncout and s_noutfiles < nprocs) { -#ifdef AMREX_MPI_THREAD_MULTIPLE + int provided = -1; + MPI_Query_thread(&provided); + if (provided < MPI_THREAD_MULTIPLE) + amrex::Abort("AsyncOut with " + std::to_string(s_noutfiles) + " and " + + std::to_string(nprocs) + " processes requires " + + "MPI_THREAD_MULTIPLE at runtime, but got " + + ParallelDescriptor::mpi_level_to_string(provided)); + int myproc = ParallelDescriptor::MyProc(); s_info = GetWriteInfo(myproc); MPI_Comm_split(ParallelDescriptor::Communicator(), s_info.ifile, myproc, &s_comm); -#else - amrex::Abort("AsyncOut with " + std::to_string(s_noutfiles) + " and " - +std::to_string(nprocs) + " processes requires MPI_THREAD_MULTIPLE"); -#endif } +#endif - if (s_asyncout) s_thread.reset(new std::thread(do_job)); + if (s_asyncout) s_thread.reset(new BackgroundThread()); ExecOnFinalize(Finalize); } @@ -71,8 +63,6 @@ void Initialize () void Finalize () { if (s_thread) { - Submit([] () { s_finalizing = true; }); - s_thread->join(); s_thread.reset(); } @@ -109,25 +99,17 @@ WriteInfo GetWriteInfo (int rank) void Submit (std::function&& a_f) { - std::lock_guard lck(s_mutx); - s_func.emplace(std::move(a_f)); - s_cond.notify_one(); + s_thread->Submit(std::move(a_f)); } void Submit (std::function const& a_f) { - std::lock_guard lck(s_mutx); - s_func.emplace(a_f); - s_cond.notify_one(); + s_thread->Submit(a_f); } void Finish () { - if (s_thread) { - Submit([] () { s_finalizing = true; }); - s_thread->join(); - s_thread.reset(new std::thread(do_job)); - } + s_thread->Finish(); } void Wait () diff --git a/Src/Base/AMReX_BCUtil.cpp b/Src/Base/AMReX_BCUtil.cpp index 033e81fc71a..3a950d29d4f 100644 --- a/Src/Base/AMReX_BCUtil.cpp +++ b/Src/Base/AMReX_BCUtil.cpp @@ -6,11 +6,11 @@ namespace amrex namespace { -void dummy_cpu_fill_extdir (Box const& bx, Array4 const& dest, - const int dcomp, const int numcomp, - GeometryData const& geom, const Real time, - const BCRec* bcr, const int bcomp, - const int orig_comp) +void dummy_cpu_fill_extdir (Box const& /*bx*/, Array4 const& /*dest*/, + const int /*dcomp*/, const int /*numcomp*/, + GeometryData const& /*geom*/, const Real /*time*/, + const BCRec* /*bcr*/, const int /*bcomp*/, + const int /*orig_comp*/) { // do something for external Dirichlet (BCType::ext_dir) if there are } @@ -18,11 +18,11 @@ void dummy_cpu_fill_extdir (Box const& bx, Array4 const& dest, struct dummy_gpu_fill_extdir { AMREX_GPU_DEVICE - void operator() (const IntVect& iv, Array4 const& dest, - const int dcomp, const int numcomp, - GeometryData const& geom, const Real time, - const BCRec* bcr, const int bcomp, - const int orig_comp) const + void operator() (const IntVect& /*iv*/, Array4 const& /*dest*/, + const int 
/*dcomp*/, const int /*numcomp*/, + GeometryData const& /*geom*/, const Real /*time*/, + const BCRec* /*bcr*/, const int /*bcomp*/, + const int /*orig_comp*/) const { // do something for external Dirichlet (BCType::ext_dir) if there are } diff --git a/Src/Base/AMReX_BLBackTrace.H b/Src/Base/AMReX_BLBackTrace.H index ab2335e133a..df9029ceff1 100644 --- a/Src/Base/AMReX_BLBackTrace.H +++ b/Src/Base/AMReX_BLBackTrace.H @@ -5,31 +5,17 @@ #include #include #include - #include #include -#include -#if defined(__APPLE__) -#include -#endif - -#include -#include - #ifdef _OPENMP #include #endif -#ifdef AMREX_BACKTRACING #define BL_PASTE2(x, y) x##y #define BL_PASTE(x, y) BL_PASTE2(x, y) #define BL_BACKTRACE_PUSH( S ) amrex::BLBTer BL_PASTE( bl_bter, __COUNTER__ )( S, __FILE__, __LINE__ ) #define BL_BACKTRACE_POP() amrex::BLBackTrace::bt_stack.pop() -#else -#define BL_BACKTRACE_PUSH(S) ((void)0) -#define BL_BACKTRACE_POP(S) ((void)0) -#endif namespace amrex { @@ -41,16 +27,13 @@ struct BLBackTrace //! Non-abort backtrace. Prints to specified file and continues. static void print_backtrace_info (const std::string& filename); -#ifdef AMREX_BACKTRACING static std::stack > bt_stack; // threadprivate here doesn't work with Cray and Intel -#if defined(_OPENMP) && !defined(_CRAYC) && !defined(__INTEL_COMPILER) +#if defined(_OPENMP) && !defined(_CRAYC) && !defined(__INTEL_COMPILER) && !defined(__PGI) #pragma omp threadprivate(bt_stack) #endif -#endif // AMREX_BACKTRACING }; -#ifdef AMREX_BACKTRACING class BLBTer { public: @@ -60,7 +43,6 @@ private: std::string line_file; void pop_bt_stack(); }; -#endif // AMREX_BACKTRACING } diff --git a/Src/Base/AMReX_BLBackTrace.cpp b/Src/Base/AMReX_BLBackTrace.cpp index 77ccba2bbd7..e78cf7549e9 100644 --- a/Src/Base/AMReX_BLBackTrace.cpp +++ b/Src/Base/AMReX_BLBackTrace.cpp @@ -1,22 +1,23 @@ -#include -#include -#include -#include -#include - -#include - #include #include #include #include #include #include +#include #ifdef AMREX_TINY_PROFILING #include #endif +#include +#include +#include +#include +#include +#include +#include + #if defined(AMREX_EXPORT_DYNAMIC) && defined(__APPLE__) #include #include @@ -25,11 +26,14 @@ #define AMREX_BACKTRACE_SUPPORTED 1 #endif +#ifndef _WIN32 +#include +#include +#endif + namespace amrex { -#ifdef AMREX_BACKTRACING std::stack > BLBackTrace::bt_stack; -#endif void BLBackTrace::handler(int s) @@ -78,7 +82,6 @@ BLBackTrace::handler(int s) amrex::ErrorStream() << "See " << errfilename << " file for details" << std::endl; -#ifdef AMREX_BACKTRACING if (!bt_stack.empty()) { std::ofstream errfile; errfile.open(errfilename.c_str(), std::ofstream::out | std::ofstream::app); @@ -92,7 +95,6 @@ BLBackTrace::handler(int s) errfile << std::endl; } } -#endif #ifdef AMREX_TINY_PROFILING { @@ -107,7 +109,7 @@ BLBackTrace::handler(int s) #endif if (ParallelDescriptor::NProcs() > 1) { - sleep(3); + amrex::Sleep(3); } #endif @@ -292,8 +294,6 @@ BLBackTrace::print_backtrace_info (FILE* f) #endif } -#ifdef AMREX_BACKTRACING - BLBTer::BLBTer(const std::string& s, const char* file, int line) { std::ostringstream ss; @@ -353,6 +353,4 @@ BLBTer::pop_bt_stack() } } -#endif - } diff --git a/Src/Base/AMReX_BLFort.H b/Src/Base/AMReX_BLFort.H index b2dc6a41f50..b7311f7fe9e 100644 --- a/Src/Base/AMReX_BLFort.H +++ b/Src/Base/AMReX_BLFort.H @@ -110,7 +110,7 @@ // Define macros for doing reductions. 
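/* With the AMREX_BACKTRACING guard removed, BL_BACKTRACE_PUSH is always
   available. A usage sketch for annotating a region so that it appears in
   the Backtrace file written by the handler (the function name here is a
   placeholder):

       void advance_hydro ()
       {
           BL_BACKTRACE_PUSH("advance_hydro");
           // ... work that might call amrex::Abort() ...
       }

   The macro creates a scoped BLBTer object, so the matching pop happens
   automatically when the scope exits; BL_BACKTRACE_POP() is also available
   for popping bt_stack explicitly. */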
-#ifdef AMREX_USE_GPU +#if defined(AMREX_USE_GPU) && defined(AMREX_USE_GPU_PRAGMA) #define AMREX_MFITER_REDUCE_SUM(var) mfi.add_reduce_value(var, amrex::MFIter::SUM) #define AMREX_MFITER_REDUCE_MIN(var) mfi.add_reduce_value(var, amrex::MFIter::MIN) #define AMREX_MFITER_REDUCE_MAX(var) mfi.add_reduce_value(var, amrex::MFIter::MAX) diff --git a/Src/Base/AMReX_BLProfiler.H b/Src/Base/AMReX_BLProfiler.H index cb4eff409b2..e242751018e 100644 --- a/Src/Base/AMReX_BLProfiler.H +++ b/Src/Base/AMReX_BLProfiler.H @@ -525,17 +525,17 @@ namespace amrex { class BLProfiler { public: - explicit BLProfiler(const std::string &funcname) { } + explicit BLProfiler(const std::string &/*funcname*/) { } static void Initialize() { } static void InitParams() { } static void Finalize() { } - static void WriteStats(std::ostream &os) { } + static void WriteStats(std::ostream &/*os*/) { } static void WriteCommStats() { } void start() { } void stop() { } - static void InitParams(const Real ptl, const bool writeall, - const bool writefabs) { } - static void AddStep(const int snum) { } + static void InitParams(const Real /*ptl*/, const bool /*writeall*/, + const bool /*writefabs*/) { } + static void AddStep(const int /*snum*/) { } }; } diff --git a/Src/Base/AMReX_BLProfiler.cpp b/Src/Base/AMReX_BLProfiler.cpp index 8ba85b83477..21bfd2a2faa 100644 --- a/Src/Base/AMReX_BLProfiler.cpp +++ b/Src/Base/AMReX_BLProfiler.cpp @@ -513,11 +513,13 @@ namespace BLProfilerUtils { void WriteHeader(std::ostream &ios, const int colWidth, const Real maxlen, const bool bwriteavg) { + int maxlenI = int(maxlen); + if(bwriteavg) { - ios << std::setfill('-') << std::setw(maxlen+4 + 7 * (colWidth+2)) + ios << std::setfill('-') << std::setw(maxlenI+4 + 7 * (colWidth+2)) << std::left << "Total times " << '\n'; ios << std::right << std::setfill(' '); - ios << std::setw(maxlen + 2) << "Function Name" + ios << std::setw(maxlenI + 2) << "Function Name" << std::setw(colWidth + 2) << "NCalls" << std::setw(colWidth + 2) << "Min" << std::setw(colWidth + 2) << "Avg" @@ -527,10 +529,10 @@ void WriteHeader(std::ostream &ios, const int colWidth, << std::setw(colWidth + 4) << "Percent %" << '\n'; } else { - ios << std::setfill('-') << std::setw(maxlen+4 + 3 * (colWidth+2)) + ios << std::setfill('-') << std::setw(maxlenI+4 + 3 * (colWidth+2)) << std::left << "Total times " << '\n'; ios << std::right << std::setfill(' '); - ios << std::setw(maxlen + 2) << "Function Name" + ios << std::setw(maxlenI + 2) << "Function Name" << std::setw(colWidth + 2) << "NCalls" << std::setw(colWidth + 2) << "Time" << std::setw(colWidth + 4) << "Percent %" @@ -544,6 +546,7 @@ void WriteRow(std::ostream &ios, const std::string &fname, const int colWidth, const Real maxlen, const bool bwriteavg) { + int maxlenI = int(maxlen); int numPrec(4), pctPrec(2); Real stdDev(0.0), coeffVariation(0.0); if(pstats.variance > 0.0) { @@ -555,7 +558,7 @@ void WriteRow(std::ostream &ios, const std::string &fname, if(bwriteavg) { ios << std::right; - ios << std::setw(maxlen + 2) << fname << " " + ios << std::setw(maxlenI + 2) << fname << " " << std::setw(colWidth) << pstats.nCalls << " " << std::setprecision(numPrec) << std::fixed << std::setw(colWidth) << pstats.minTime << " " @@ -570,7 +573,7 @@ void WriteRow(std::ostream &ios, const std::string &fname, << std::setprecision(pctPrec) << std::fixed << std::setw(colWidth) << percent << " %" << '\n'; } else { - ios << std::setw(maxlen + 2) << fname << " " + ios << std::setw(maxlenI + 2) << fname << " " << std::setw(colWidth) << pstats.nCalls << " " << 
std::setprecision(numPrec) << std::fixed << std::setw(colWidth) << pstats.totalTime << " " @@ -770,7 +773,7 @@ void WriteStats(std::ostream &ios, } // end namespace BLProfilerUtils void BLProfiler::WriteBaseProfile(bool bFlushing, bool memCheck) { // ---- write basic profiling data - + amrex::ignore_unused(memCheck); // --------------------------------------- gather global stats Real baseProfStart(amrex::second()); // time the timer const int nProcs(ParallelDescriptor::NProcs()); @@ -1162,8 +1165,9 @@ void BLProfiler::WriteCallTrace(bool bFlushing, bool memCheck) { // ---- write -void BLProfiler::WriteCommStats(bool bFlushing, bool memCheck) { - +void BLProfiler::WriteCommStats(bool bFlushing, bool memCheck) +{ + amrex::ignore_unused(bFlushing); Real wcsStart(amrex::second()); bool bAllCFTypesExcluded(OnExcludeList(AllCFTypes)); if( ! bAllCFTypesExcluded) { @@ -1461,6 +1465,7 @@ void BLProfiler::AddAllReduce(const CommFuncType cft, const int size, void BLProfiler::AddWait(const CommFuncType cft, const MPI_Request &req, const MPI_Status &status, const bool beforecall) { + amrex::ignore_unused(req); #ifdef BL_USE_MPI if(OnExcludeList(cft)) { return; @@ -1481,6 +1486,7 @@ void BLProfiler::AddWaitsome(const CommFuncType cft, const Vector & const int completed, const Vector &status, const bool beforecall) { + amrex::ignore_unused(reqs); #ifdef BL_USE_MPI if(OnExcludeList(cft)) { return; @@ -1658,28 +1664,28 @@ namespace amrex { BL_FORT_PROC_DECL(BL_PROFFORTFUNCSTART_CPP,bl_proffortfuncstart_cpp) ( - const int istr[], const int *NSTR + const int /*istr*/[], const int * /*NSTR*/ ) { } BL_FORT_PROC_DECL(BL_PROFFORTFUNCSTOP_CPP,bl_proffortfuncstop_cpp) ( - const int istr[], const int *NSTR + const int /*istr*/[], const int * /*NSTR*/ ) { } BL_FORT_PROC_DECL(BL_PROFFORTFUNCSTART_CPP_INT,bl_proffortfuncstart_cpp_int) ( - int i + int /*i*/ ) { } BL_FORT_PROC_DECL(BL_PROFFORTFUNCSTOP_CPP_INT,bl_proffortfuncstop_cpp_int) ( - int i + int /*i*/ ) { } diff --git a/Src/Base/AMReX_BackgroundThread.H b/Src/Base/AMReX_BackgroundThread.H new file mode 100644 index 00000000000..33283c60d49 --- /dev/null +++ b/Src/Base/AMReX_BackgroundThread.H @@ -0,0 +1,39 @@ +#ifndef AMREX_BACKGROUND_THREAD_H_ +#define AMREX_BACKGROUND_THREAD_H_ + +#include +#include +#include +#include +#include +#include +#include + +namespace amrex { + +class BackgroundThread +{ +public: + BackgroundThread (); + ~BackgroundThread (); + + void Submit (std::function&& a_f); + void Submit (std::function const& a_f); + + void Finish (); // Not required. Call this if you want all jobs to finish. 
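/* Usage sketch (illustrative; do_work is a placeholder):

       BackgroundThread bt;
       bt.Submit([] () { do_work(); });  // enqueue and return immediately
       bt.Finish();                      // optional: block until the queue drains

   The destructor enqueues a finalizing job and then joins, so everything
   submitted earlier is guaranteed to run before the thread exits. */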
+ +private: + void do_job (); + + std::unique_ptr m_thread; + std::mutex m_mutx; + std::condition_variable m_job_cond; + std::condition_variable m_done_cond; + std::queue > m_func; + bool m_clearing = false; + bool m_finalizing = false; +}; + +} + +#endif diff --git a/Src/Base/AMReX_BackgroundThread.cpp b/Src/Base/AMReX_BackgroundThread.cpp new file mode 100644 index 00000000000..31a2568d337 --- /dev/null +++ b/Src/Base/AMReX_BackgroundThread.cpp @@ -0,0 +1,63 @@ +#include + +namespace amrex { + +BackgroundThread::BackgroundThread () +{ + m_thread.reset(new std::thread(&BackgroundThread::do_job, this)); +} + +BackgroundThread::~BackgroundThread () +{ + if (m_thread) { + Submit([this] () { m_finalizing = true; }); + m_thread->join(); + m_thread.reset(); + } +} + +void BackgroundThread::do_job () +{ + while (true) + { + std::unique_lock lck(m_mutx); + m_job_cond.wait(lck, [this] () -> bool { return !m_func.empty(); }); + auto f = m_func.front(); + m_func.pop(); + lck.unlock(); + f(); + if (m_clearing) { // All jobs before this have finished. + m_done_cond.notify_one(); + } + if (m_finalizing) { + break; + } + } +} + +void BackgroundThread::Submit (std::function&& a_f) +{ + std::lock_guard lck(m_mutx); + m_func.emplace(std::move(a_f)); + m_job_cond.notify_one(); +} + +void BackgroundThread::Submit (std::function const& a_f) +{ + std::lock_guard lck(m_mutx); + m_func.emplace(a_f); + m_job_cond.notify_one(); +} + +void BackgroundThread::Finish () +{ + if (m_thread) { + Submit([this] () { m_clearing = true; }); + std::unique_lock lck(m_mutx); + m_done_cond.wait(lck, [this] () -> bool { return m_func.empty(); }); + m_clearing = false; + lck.unlock(); + } +} + +} diff --git a/Src/Base/AMReX_BaseFab.H b/Src/Base/AMReX_BaseFab.H index d9660dcf635..b33884ba933 100644 --- a/Src/Base/AMReX_BaseFab.H +++ b/Src/Base/AMReX_BaseFab.H @@ -33,11 +33,6 @@ #include #include -#ifdef USE_PERILLA -#include -#include -#endif - namespace amrex { @@ -278,7 +273,7 @@ public: */ void resize (const Box& b, int N = 1); - template ::value>::type > + template ::value,int>::type = 0> Elixir elixir () noexcept; /** @@ -298,7 +293,7 @@ public: } //! Returns bytes used in the Box for those components - std::size_t nBytes (const Box& bx, int start_comp, int ncomps) const noexcept + std::size_t nBytes (const Box& bx, int ncomps) const noexcept { return bx.numPts() * sizeof(T) * ncomps; } //! Returns the number of components @@ -1610,15 +1605,6 @@ protected: Long truesize = 0L; //!< nvar*numpts that was allocated on heap. bool ptr_owner = false; //!< Owner of T*? bool shared_memory = false; //!< Is the memory allocated in shared memory? 
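/* Sketch of the elixir() idiom declared above, for temporaries consumed by
   asynchronous GPU kernels (illustrative; FArrayBox is BaseFab<Real>):

       FArrayBox tmpfab(bx, ncomp);
       Elixir eli = tmpfab.elixir();   // takes over the lifetime of the data
       auto const& tmp = tmpfab.array();
       amrex::ParallelFor(bx, [=] AMREX_GPU_DEVICE (int i, int j, int k)
       {
           tmp(i,j,k) = 0.0;           // use the temporary on the device
       });
       // tmpfab may now go out of scope; the Elixir keeps the allocation
       // alive until kernels on the current stream have completed.
*/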
- -#ifdef USE_PERILLA -public: - LocalConnection l_con; - RemoteConnection r_con; - bool fireable; - int padding[1024]; -#endif - }; template @@ -1659,12 +1645,14 @@ BaseFab::prefetchToHost () const noexcept // auto& q = Gpu::Device::streamQueue(); // q.submit([&] (sycl::handler& h) { h.prefetch(this->dptr, s); }); #elif defined(AMREX_USE_CUDA) - std::size_t s = sizeof(T)*this->nvar*this->domain.numPts(); - AMREX_CUDA_SAFE_CALL(cudaMemPrefetchAsync(this->dptr, s, - cudaCpuDeviceId, - Gpu::gpuStream())); + if (Gpu::Device::devicePropMajor() >= 6) { + std::size_t s = sizeof(T)*this->nvar*this->domain.numPts(); + AMREX_CUDA_SAFE_CALL(cudaMemPrefetchAsync(this->dptr, s, + cudaCpuDeviceId, + Gpu::gpuStream())); + } #elif defined(AMREX_USE_HIP) - // HIP FIX HERE + // xxxxx HIP FIX HERE after managed memory is supported #endif } #endif @@ -1681,12 +1669,14 @@ BaseFab::prefetchToDevice () const noexcept auto& q = Gpu::Device::streamQueue(); q.submit([&] (sycl::handler& h) { h.prefetch(this->dptr, s); }); #elif defined(AMREX_USE_CUDA) - std::size_t s = sizeof(T)*this->nvar*this->domain.numPts(); - AMREX_CUDA_SAFE_CALL(cudaMemPrefetchAsync(this->dptr, s, - Gpu::Device::deviceId(), - Gpu::gpuStream())); + if (Gpu::Device::devicePropMajor() >= 6) { + std::size_t s = sizeof(T)*this->nvar*this->domain.numPts(); + AMREX_CUDA_SAFE_CALL(cudaMemPrefetchAsync(this->dptr, s, + Gpu::Device::deviceId(), + Gpu::gpuStream())); + } #elif defined(AMREX_USE_HIP) - // HIP FIX HERE + // xxxxx HIP FIX HERE after managed memory is supported #endif } #endif @@ -2036,7 +2026,7 @@ BaseFab::resize (const Box& b, int n) } template -template +template ::value,int>::type> Elixir BaseFab::elixir () noexcept { @@ -2470,7 +2460,7 @@ BaseFab::maxabs (const Box& subbox, int comp) const noexcept #endif { T r = 0; - amrex::Loop(subbox, [=,&r] (int i, int j, int k) AMREX_NOEXCEPT + amrex::Loop(subbox, [=,&r] (int i, int j, int k) noexcept { r = amrex::max(r, amrex::Math::abs(a(i,j,k))); }); @@ -3943,7 +3933,7 @@ BaseFab::sum (const Box& bx, DestComp dcomp, NumComps ncomp) const noexcept } else #endif { - amrex::LoopOnCpu(bx, ncomp.n, [=,&r] (int i, int j, int k, int n) AMREX_NOEXCEPT + amrex::LoopOnCpu(bx, ncomp.n, [=,&r] (int i, int j, int k, int n) noexcept { r += a(i,j,k,n+dcomp.i); }); @@ -3983,7 +3973,7 @@ BaseFab::dot (const BaseFab& src, const Box& bx, SrcComp scomp, DestComp d } else #endif { - amrex::LoopOnCpu(bx, ncomp.n, [=,&r] (int i, int j, int k, int n) AMREX_NOEXCEPT + amrex::LoopOnCpu(bx, ncomp.n, [=,&r] (int i, int j, int k, int n) noexcept { r += d(i,j,k,n+dcomp.i) * s(i,j,k,n+scomp.i); }); @@ -4029,7 +4019,7 @@ BaseFab::dot (const Box& bx, DestComp dcomp, NumComps ncomp) const noexcept } else #endif { - amrex::LoopOnCpu(bx, ncomp.n, [=,&r] (int i, int j, int k, int n) AMREX_NOEXCEPT + amrex::LoopOnCpu(bx, ncomp.n, [=,&r] (int i, int j, int k, int n) noexcept { r += a(i,j,k,n+dcomp.i)*a(i,j,k,n+dcomp.i); }); @@ -4073,7 +4063,7 @@ BaseFab::dotmask (const BaseFab& src, const Box& bx, const BaseFab& m } else #endif { - amrex::LoopOnCpu(bx, ncomp.n, [=,&r] (int i, int j, int k, int n) AMREX_NOEXCEPT + amrex::LoopOnCpu(bx, ncomp.n, [=,&r] (int i, int j, int k, int n) noexcept { int mi = static_cast(static_cast(m(i,j,k))); r += d(i,j,k,n+dcomp.i)*s(i,j,k,n+scomp.i)*mi; diff --git a/Src/Base/AMReX_BaseFabUtility.H b/Src/Base/AMReX_BaseFabUtility.H index 2fba229ea29..73f68960685 100644 --- a/Src/Base/AMReX_BaseFabUtility.H +++ b/Src/Base/AMReX_BaseFabUtility.H @@ -9,11 +9,11 @@ template AMREX_GPU_HOST_DEVICE void cast 
(BaseFab& tofab, BaseFab const& fromfab, - Box const& bx, SrcComp scomp, DestComp dcomp, NumComps ncomp) AMREX_NOEXCEPT + Box const& bx, SrcComp scomp, DestComp dcomp, NumComps ncomp) noexcept { auto const& tdata = tofab.array(); auto const& fdata = fromfab.const_array(); - amrex::LoopConcurrent(bx, ncomp.n, [=] (int i, int j, int k, int n) AMREX_NOEXCEPT + amrex::LoopConcurrent(bx, ncomp.n, [=] (int i, int j, int k, int n) noexcept { tdata(i,j,k,n+dcomp.i) = static_cast(fdata(i,j,k,n+scomp.i)); }); diff --git a/Src/Base/AMReX_BlockMutex.H b/Src/Base/AMReX_BlockMutex.H index 8339bfce8a0..b00c55e797f 100644 --- a/Src/Base/AMReX_BlockMutex.H +++ b/Src/Base/AMReX_BlockMutex.H @@ -11,7 +11,7 @@ struct BlockMutex { union state_t { - struct { int blockid; int count; }; + struct II { int blockid; int count; } data; unsigned long long ull; }; @@ -32,6 +32,7 @@ struct BlockMutex void lock (int i) noexcept { #ifdef AMREX_USE_DPCPP // xxxxx DPCPP todo + amrex::ignore_unused(i); #else int blockid = blockIdx.z*blockDim.x*blockDim.y + blockIdx.y*blockDim.x + blockIdx.x; state_t old = m_state[i]; @@ -39,13 +40,13 @@ struct BlockMutex do { assumed = old; state_t val; - val.blockid = blockid; - if (assumed.blockid == blockid) { + val.data.blockid = blockid; + if (assumed.data.blockid == blockid) { // Already locked by another thread in this block. Need to ++count. - val.count = assumed.count + 1; + val.data.count = assumed.data.count + 1; } else { // Currently unlocked or locked by another block. Need to lock. - val.count = 1; + val.data.count = 1; assumed = FreeState(); } old.ull = atomicCAS((unsigned long long*)(m_state+i), assumed.ull, val.ull); @@ -57,19 +58,20 @@ struct BlockMutex void unlock (int i) noexcept { #ifdef AMREX_USE_DPCPP // xxxxx DPCPP todo + amrex::ignore_unused(i); #else state_t old = m_state[i]; state_t assumed; do { assumed = old; state_t val; - if (assumed.count == 1) { + if (assumed.data.count == 1) { // Need to unlock val = FreeState(); } else { // --count, but do NOT unlock val = assumed; - --val.count; + --val.data.count; } old.ull = atomicCAS((unsigned long long*)(m_state+i), assumed.ull, val.ull); } while (assumed.ull != old.ull); diff --git a/Src/Base/AMReX_BlockMutex.cpp b/Src/Base/AMReX_BlockMutex.cpp index e1bdf5d75bb..e16892fec17 100644 --- a/Src/Base/AMReX_BlockMutex.cpp +++ b/Src/Base/AMReX_BlockMutex.cpp @@ -6,6 +6,7 @@ namespace amrex { void BlockMutex::init_states (state_t* state, int N) noexcept { #ifdef AMREX_USE_DPCPP + amrex::ignore_unused(state,N); amrex::Abort("xxxxx DPCPP todo"); #else amrex::launch((N+255)/256, 256, Gpu::nullStream(), diff --git a/Src/Base/AMReX_Box.H b/Src/Base/AMReX_Box.H index 3a06cdccb6b..2927288e5e3 100644 --- a/Src/Base/AMReX_Box.H +++ b/Src/Base/AMReX_Box.H @@ -152,33 +152,33 @@ public: AMREX_GPU_HOST_DEVICE GpuArray length3d () const noexcept { #if (AMREX_SPACEDIM == 1) - return {bigend[0]-smallend[0]+1, 1, 1}; + return {{bigend[0]-smallend[0]+1, 1, 1}}; #elif (AMREX_SPACEDIM == 2) - return {bigend[0]-smallend[0]+1, bigend[1]-smallend[1]+1, 1}; + return {{bigend[0]-smallend[0]+1, bigend[1]-smallend[1]+1, 1}}; #elif (AMREX_SPACEDIM == 3) - return {bigend[0]-smallend[0]+1, bigend[1]-smallend[1]+1, bigend[2]-smallend[2]+1}; + return {{bigend[0]-smallend[0]+1, bigend[1]-smallend[1]+1, bigend[2]-smallend[2]+1}}; #endif } AMREX_GPU_HOST_DEVICE GpuArray loVect3d () const noexcept { #if (AMREX_SPACEDIM == 1) - return {smallend[0], 0, 0}; + return {{smallend[0], 0, 0}}; #elif (AMREX_SPACEDIM == 2) - return {smallend[0], smallend[1], 0}; + 
return {{smallend[0], smallend[1], 0}}; #elif (AMREX_SPACEDIM == 3) - return {smallend[0], smallend[1], smallend[2]}; + return {{smallend[0], smallend[1], smallend[2]}}; #endif } AMREX_GPU_HOST_DEVICE GpuArray hiVect3d () const noexcept { #if (AMREX_SPACEDIM == 1) - return {bigend[0], 0, 0}; + return {{bigend[0], 0, 0}}; #elif (AMREX_SPACEDIM == 2) - return {bigend[0], bigend[1], 0}; + return {{bigend[0], bigend[1], 0}}; #elif (AMREX_SPACEDIM == 3) - return {bigend[0], bigend[1], bigend[2]}; + return {{bigend[0], bigend[1], bigend[2]}}; #endif } @@ -473,6 +473,9 @@ public: AMREX_GPU_HOST_DEVICE Box& surroundingNodes (int dir) noexcept; + AMREX_GPU_HOST_DEVICE + Box& surroundingNodes (Direction d) noexcept { return surroundingNodes(static_cast(d)); } + //! Convert to CELL type in all directions. AMREX_GPU_HOST_DEVICE Box& enclosedCells () noexcept; @@ -481,6 +484,9 @@ public: AMREX_GPU_HOST_DEVICE Box& enclosedCells (int dir) noexcept; + AMREX_GPU_HOST_DEVICE + Box& enclosedCells (Direction d) noexcept { return enclosedCells(static_cast(d)); } + /** * \brief Return Box that is intersection of this Box * and argument. The Boxes MUST be of same type. @@ -498,17 +504,6 @@ public: return *this; } - //! for serialization - static size_t linearSize() noexcept - { - size_t retval = 2*IntVect::linearSize(); - return retval; - } - - //! for serialization - void linearOut(void* a_buffer ) const noexcept; - void linearIn(void* a_buffer ) noexcept; - /** * \brief Modify Box to that of the minimum Box containing both * the original Box and the argument. @@ -572,6 +567,9 @@ public: AMREX_GPU_HOST_DEVICE Box& grow (int idir, int n_cell) noexcept { smallend.shift(idir, -n_cell); bigend.shift(idir, n_cell); return *this; } + AMREX_GPU_HOST_DEVICE + Box& grow (Direction d, int n_cell) noexcept { return grow(static_cast(d), n_cell); } + /** * \brief Grow the Box on the low end by n_cell cells in direction idir. * NOTE: n_cell negative shrinks the Box by that number of cells. @@ -579,6 +577,9 @@ public: AMREX_GPU_HOST_DEVICE Box& growLo (int idir, int n_cell = 1) noexcept { smallend.shift(idir, -n_cell); return *this; } + AMREX_GPU_HOST_DEVICE + Box& growLo (Direction d, int n_cell = 1) noexcept { return growLo(static_cast(d), n_cell); } + /** * \brief Grow the Box on the high end by n_cell cells in * direction idir. NOTE: n_cell negative shrinks the Box by that @@ -587,6 +588,9 @@ public: AMREX_GPU_HOST_DEVICE Box& growHi (int idir, int n_cell = 1) noexcept { bigend.shift(idir,n_cell); return *this; } + AMREX_GPU_HOST_DEVICE + Box& growHi (Direction d, int n_cell = 1) noexcept { return growHi(static_cast(d), n_cell); } + //! Grow in the direction of the given face. 
AMREX_GPU_HOST_DEVICE Box& grow (Orientation face, int n_cell = 1) noexcept { @@ -871,7 +875,6 @@ Box::atOffset (Long offset) const noexcept static_cast(k+lo[2])) }; } -// HIP FIX HERE - Initialization List: {{ AMREX_GPU_HOST_DEVICE AMREX_FORCE_INLINE GpuArray @@ -899,34 +902,6 @@ Box::setRange (int dir, return *this; } -inline -void -Box::linearOut(void* a_buffer ) const noexcept -{ - unsigned char* buf = (unsigned char*) a_buffer; - const IntVect& ivlo = this->smallEnd(); - const IntVect& ivhi = this->bigEnd(); - ivlo.linearOut(buf); - buf += ivlo.linearSize(); - ivhi.linearOut(buf); -// buf += ivhi.linearSize(); -} - -inline -void -Box::linearIn(void* a_buffer ) noexcept -{ - unsigned char* buf = (unsigned char*) a_buffer; - IntVect ivlo; - IntVect ivhi; - ivlo.linearIn(buf); - buf += ivlo.linearSize(); - ivhi.linearIn(buf); -// buf += ivhi.linearSize(); - - *this = Box(ivlo, ivhi); -} - AMREX_GPU_HOST_DEVICE AMREX_FORCE_INLINE void @@ -1071,7 +1046,7 @@ public: inline BoxConverter::~BoxConverter () { } -void AllGatherBoxes (Vector& bxs); +void AllGatherBoxes (Vector& bxs, int n_extra_reserve=0); /** * \brief Grow Box in all directions by given amount. @@ -1107,6 +1082,13 @@ Box grow (const Box& b, int idir, int n_cell) noexcept return result; } +AMREX_GPU_HOST_DEVICE +AMREX_FORCE_INLINE +Box grow (const Box& b, Direction d, int n_cell) noexcept +{ + return grow(b, static_cast(d), n_cell); +} + AMREX_GPU_HOST_DEVICE AMREX_FORCE_INLINE Box growLo (const Box& b, int idir, int n_cell) noexcept @@ -1116,6 +1098,13 @@ Box growLo (const Box& b, int idir, int n_cell) noexcept return result; } +AMREX_GPU_HOST_DEVICE +AMREX_FORCE_INLINE +Box growLo (const Box& b, Direction d, int n_cell) noexcept +{ + return growLo(b, static_cast(d), n_cell); +} + AMREX_GPU_HOST_DEVICE AMREX_FORCE_INLINE Box growHi (const Box& b, int idir, int n_cell) noexcept @@ -1125,6 +1114,13 @@ Box growHi (const Box& b, int idir, int n_cell) noexcept return result; } +AMREX_GPU_HOST_DEVICE +AMREX_FORCE_INLINE +Box growHi (const Box& b, Direction d, int n_cell) noexcept +{ + return growHi(b, static_cast(d), n_cell); +} + /** * \brief Coarsen Box by given (positive) refinement ratio. * NOTE: if type(dir) = CELL centered: lo <- lo/ratio and @@ -1226,6 +1222,13 @@ Box surroundingNodes (const Box& b, int dir) noexcept return bx; } +AMREX_GPU_HOST_DEVICE +AMREX_FORCE_INLINE +Box surroundingNodes (const Box& b, Direction d) noexcept +{ + return surroundingNodes(b, static_cast(d)); +} + /** * \brief Returns a Box with NODE based coordinates in all * directions that encloses Box b. @@ -1273,6 +1276,13 @@ Box enclosedCells (const Box& b, int dir) noexcept return bx; } +AMREX_GPU_HOST_DEVICE +AMREX_FORCE_INLINE +Box enclosedCells (const Box& b, Direction d) noexcept +{ + return enclosedCells(b, static_cast(d)); +} + /** * \brief Returns a Box with CELL based coordinates in all * directions that is enclosed by b. diff --git a/Src/Base/AMReX_Box.cpp b/Src/Base/AMReX_Box.cpp index 5e6a92a65ac..b0d6423e032 100644 --- a/Src/Base/AMReX_Box.cpp +++ b/Src/Base/AMReX_Box.cpp @@ -104,19 +104,51 @@ BoxCommHelper::BoxCommHelper (const Box& bx, int* p_) } void -AllGatherBoxes (Vector& bxs) +AllGatherBoxes (Vector& bxs, int n_extra_reserve) { #ifdef BL_USE_MPI - // cell centered boxes only! 
-    const auto szof_bx = Box::linearSize();
-    const Long count = bxs.size() * static_cast<Long>(szof_bx);
-    const auto& countvec = ParallelDescriptor::Gather(count, ParallelDescriptor::IOProcessorNumber());
-
+#if 0
+    // In principle, MPI_Allgather/MPI_Allgatherv should not be slower than
+    // MPI_Gather/MPI_Gatherv followed by MPI_Bcast. But that's not true on Summit.
+    MPI_Comm comm = ParallelContext::CommunicatorSub();
+    const int count = bxs.size();
+    Vector<int> countvec(ParallelContext::NProcsSub());
+    MPI_Allgather(&count, 1, MPI_INT, countvec.data(), 1, MPI_INT, comm);
+
+    Vector<int> offset(countvec.size(),0);
+    Long count_tot = countvec[0];
+    for (int i = 1, N = offset.size(); i < N; ++i) {
+        offset[i] = offset[i-1] + countvec[i-1];
+        count_tot += countvec[i];
+    }
+
+    if (count_tot == 0) return;
+
+    if (count_tot > static_cast<Long>(std::numeric_limits<int>::max())) {
+        amrex::Abort("AllGatherBoxes: too many boxes");
+    }
+
+    Vector<Box> recv_buffer;
+    recv_buffer.reserve(count_tot+n_extra_reserve);
+    recv_buffer.resize(count_tot);
+    MPI_Allgatherv(bxs.data(), count, ParallelDescriptor::Mpi_typemap<Box>::type(),
+                   recv_buffer.data(), countvec.data(), offset.data(),
+                   ParallelDescriptor::Mpi_typemap<Box>::type(), comm);
+
+    std::swap(bxs,recv_buffer);
+#else
+    MPI_Comm comm = ParallelContext::CommunicatorSub();
+    const int root = ParallelContext::IOProcessorNumberSub();
+    const int myproc = ParallelContext::MyProcSub();
+    const int nprocs = ParallelContext::NProcsSub();
+    const int count = bxs.size();
+    Vector<int> countvec(nprocs);
+    MPI_Gather(&count, 1, MPI_INT, countvec.data(), 1, MPI_INT, root, comm);
+
     Long count_tot = 0L;
-    Vector<Long> offset(countvec.size(),0L);
-    if (ParallelDescriptor::IOProcessor())
-    {
+    Vector<int> offset(countvec.size(),0);
+    if (myproc == root) {
         count_tot = countvec[0];
         for (int i = 1, N = offset.size(); i < N; ++i) {
             offset[i] = offset[i-1] + countvec[i-1];
@@ -124,31 +156,28 @@ AllGatherBoxes (Vector<Box>& bxs)
         }
     }

-    ParallelDescriptor::Bcast(&count_tot, 1, ParallelDescriptor::IOProcessorNumber());
+    MPI_Bcast(&count_tot, 1, MPI_INT, root, comm);

     if (count_tot == 0) return;

-    Vector<char> send_buffer(count);
-    char* psend = (count > 0) ? send_buffer.data() : nullptr;
-    char* p = psend;
-    for (const auto& b : bxs) {
-        b.linearOut(p);
-        p += szof_bx;
+    if (count_tot > static_cast<Long>(std::numeric_limits<int>::max())) {
+        amrex::Abort("AllGatherBoxes: too many boxes");
     }

-    Vector<char> recv_buffer(count_tot);
-    ParallelDescriptor::Gatherv(psend, count, recv_buffer.data(), countvec, offset, ParallelDescriptor::IOProcessorNumber());
-
-    ParallelDescriptor::Bcast(recv_buffer.data(), count_tot, ParallelDescriptor::IOProcessorNumber());
+    Vector<Box> recv_buffer;
+    recv_buffer.reserve(count_tot+n_extra_reserve);
+    recv_buffer.resize(count_tot);
+    MPI_Gatherv(bxs.data(), count, ParallelDescriptor::Mpi_typemap<Box>::type(),
+                recv_buffer.data(), countvec.data(), offset.data(),
+                ParallelDescriptor::Mpi_typemap<Box>::type(), root, comm);
+    MPI_Bcast(recv_buffer.data(), count_tot, ParallelDescriptor::Mpi_typemap<Box>::type(),
+              root, comm);

-    const Long nboxes_tot = count_tot/szof_bx;
-    bxs.resize(nboxes_tot);
+    std::swap(bxs,recv_buffer);
+#endif

-    p = recv_buffer.data();
-    for (auto& b : bxs) {
-        b.linearIn(p);
-        p += szof_bx;
-    }
+#else
+    amrex::ignore_unused(bxs,n_extra_reserve);
 #endif
 }
diff --git a/Src/Base/AMReX_BoxArray.H b/Src/Base/AMReX_BoxArray.H
index 9f4d17ecbd3..7f3f8bfdd4d 100644
--- a/Src/Base/AMReX_BoxArray.H
+++ b/Src/Base/AMReX_BoxArray.H
@@ -516,6 +516,8 @@ using BndryBATransformer = BATransformer;
  */
 class MFIter;
+class AmrMesh;
+class FabArrayBase;

 class BoxArray
 {
@@ -551,6 +553,8 @@ public:
     explicit BoxArray (BoxList&& bl) noexcept;

     BoxArray (const BoxArray& rhs, const BATransformer& trans);
+
+    BoxArray (BoxList&& bl, IntVect const& max_grid_size);

    /**
     * \brief Initialize the BoxArray from a single box.
@@ -796,10 +800,16 @@ public:
    //! Make ourselves unique.
    void uniqify ();

+    friend class AmrMesh;
+    friend class FabArrayBase;
+
 private:
    //! Update BoxArray index type according the box type, and then convert boxes to cell-centered.
    void type_update ();

+    BoxList const& simplified_list () const; // For regular AMR grids only
+    BoxArray simplified () const;
+
    BARef::HashType& getHashMap () const;

    IntVect getDoiLo () const noexcept;
@@ -808,6 +818,7 @@ private:
    BATransformer m_bat;
    //! The data -- a reference-counted pointer to a Ref.
    std::shared_ptr<BARef> m_ref;
+    mutable std::shared_ptr<BoxList> m_simplified_list;
 };

 //! Write a BoxArray to an ostream in ASCII format.
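The Gather/Gatherv path in the rewritten AllGatherBoxes above first collects the per-rank box counts and then converts them into the displacement array that MPI_Gatherv expects. A standalone sketch of that counts-to-displacements step (the function name is illustrative, not part of AMReX):

#include <vector>

// Exclusive prefix sum of per-rank element counts, as required for the
// displs argument of MPI_Gatherv/MPI_Allgatherv.
std::vector<int> gatherv_displacements (const std::vector<int>& counts)
{
    std::vector<int> displs(counts.size(), 0);
    for (std::size_t i = 1; i < counts.size(); ++i) {
        displs[i] = displs[i-1] + counts[i-1];
    }
    return displs;
}

With counts {3, 1, 4} this yields displacements {0, 3, 4} and a total of 8 boxes, matching the count_tot accumulation in the code above.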
diff --git a/Src/Base/AMReX_BoxArray.cpp b/Src/Base/AMReX_BoxArray.cpp index 1ec8ed8e4f0..cf6ebb79a1c 100644 --- a/Src/Base/AMReX_BoxArray.cpp +++ b/Src/Base/AMReX_BoxArray.cpp @@ -10,9 +10,7 @@ #include #endif -#ifdef _OPENMP -#include -#endif +#include namespace amrex { @@ -280,7 +278,8 @@ BoxArray::BoxArray () BoxArray::BoxArray (const Box& bx) : m_bat(bx.ixType()), - m_ref(std::make_shared(amrex::enclosedCells(bx))) + m_ref(std::make_shared(amrex::enclosedCells(bx))), + m_simplified_list(std::make_shared(bx)) {} BoxArray::BoxArray (const BoxList& bl) @@ -327,15 +326,30 @@ BoxArray::BoxArray (const BoxArray& rhs, const BATransformer& trans) BoxArray::BoxArray (const BoxArray& rhs) : m_bat(rhs.m_bat), - m_ref(rhs.m_ref) + m_ref(rhs.m_ref), + m_simplified_list(rhs.m_simplified_list) {} +BoxArray::BoxArray (BoxList&& bl, IntVect const& max_grid_size) + : + m_bat(), + m_ref(std::make_shared()), + m_simplified_list(std::make_shared(std::move(bl))) +{ + BoxList tmpbl = *m_simplified_list; + tmpbl.maxSize(max_grid_size); + m_bat = BATransformer(tmpbl.ixType()); + m_ref->define(std::move(tmpbl)); + type_update(); +} + void BoxArray::define (const Box& bx) { clear(); m_bat = BATransformer(bx.ixType()); m_ref->define(amrex::enclosedCells(bx)); + m_simplified_list = std::make_shared(bx); } void @@ -361,6 +375,7 @@ BoxArray::clear () { m_bat = BATransformer(); m_ref.reset(new BARef()); + m_simplified_list.reset(); } void @@ -544,7 +559,11 @@ BoxArray::maxSize (const IntVect& block_size) blst.maxSize(block_size); const int N = blst.size(); if (size() != N) { // If size doesn't change, do nothing. + BoxList bak = (m_simplified_list) ? *m_simplified_list : BoxList(); define(std::move(blst)); + if (bak.isNotEmpty()) { + m_simplified_list = std::make_shared(std::move(bak)); + } } return *this; } @@ -1023,10 +1042,8 @@ BoxArray::minimalBox () const #pragma omp parallel #endif { -#ifndef _OPENMP - int tid = 0; -#else - int tid = omp_get_thread_num(); + int tid = OpenMP::get_thread_num(); +#ifdef _OPENMP #pragma omp for #endif for (int i = 0; i < N; ++i) { @@ -1075,10 +1092,8 @@ BoxArray::minimalBox (Long& npts_avg_box) const #pragma omp parallel reduction(+:npts_tot) #endif { -#ifndef _OPENMP - int tid = 0; -#else - int tid = omp_get_thread_num(); + int tid = OpenMP::get_thread_num(); +#ifdef _OPENMP #pragma omp for #endif for (int i = 0; i < N; ++i) { @@ -1260,99 +1275,87 @@ BoxArray::complementIn (BoxList& bl, const Box& bx) const bl.set(bx.ixType()); bl.push_back(bx); - if (!empty()) - { - BARef::HashType& BoxHashMap = getHashMap(); + if (empty()) return; - BL_ASSERT(bx.ixType() == ixType()); + BARef::HashType& BoxHashMap = getHashMap(); - Box gbx = bx; + BL_ASSERT(bx.ixType() == ixType()); - IntVect glo = gbx.smallEnd(); - IntVect ghi = gbx.bigEnd(); - const IntVect& doilo = getDoiLo(); - const IntVect& doihi = getDoiHi(); + Box gbx = bx; - gbx.setSmall(glo - doihi).setBig(ghi + doilo); - gbx.refine(crseRatio()).coarsen(m_ref->crsn); - - const IntVect& sm = amrex::max(gbx.smallEnd()-1, m_ref->bbox.smallEnd()); - const IntVect& bg = amrex::min(gbx.bigEnd(), m_ref->bbox.bigEnd()); + IntVect glo = gbx.smallEnd(); + IntVect ghi = gbx.bigEnd(); + const IntVect& doilo = getDoiLo(); + const IntVect& doihi = getDoiHi(); - Box cbx(sm,bg); - cbx.normalize(); + gbx.setSmall(glo - doihi).setBig(ghi + doilo); + gbx.refine(crseRatio()).coarsen(m_ref->crsn); - if (!cbx.intersects(m_ref->bbox)) return; + const IntVect& sm = amrex::max(gbx.smallEnd()-1, m_ref->bbox.smallEnd()); + const IntVect& bg = 
amrex::min(gbx.bigEnd(), m_ref->bbox.bigEnd()); - auto TheEnd = BoxHashMap.cend(); + Box cbx(sm,bg); + cbx.normalize(); - BoxList newbl(bl.ixType()); - newbl.reserve(bl.capacity()); - BoxList newdiff(bl.ixType()); + if (!cbx.intersects(m_ref->bbox)) return; - auto& abox = m_ref->m_abox; + auto TheEnd = BoxHashMap.cend(); - for (IntVect iv = cbx.smallEnd(), End = cbx.bigEnd(); - iv <= End && bl.isNotEmpty(); - cbx.next(iv)) + Vector intersect_boxes; + auto& abox = m_ref->m_abox; + if (m_bat.is_null()) { + AMREX_LOOP_3D(cbx, i, j, k, { - auto it = BoxHashMap.find(iv); - - if (it != TheEnd) - { - if (m_bat.is_null()) { - for (const int index : it->second) - { - const Box& ibox = abox[index]; - const Box& isect = bx & ibox; - - if (isect.ok()) - { - newbl.clear(); - for (const Box& b : bl) { - amrex::boxDiff(newdiff, b, isect); - newbl.join(newdiff); - } - bl.swap(newbl); - } + auto it = BoxHashMap.find(IntVect(AMREX_D_DECL(i,j,k))); + if (it != TheEnd) { + for (const int index : it->second) { + const Box& ibox = abox[index]; + if (bx.intersects(ibox)) { + intersect_boxes.push_back(ibox); } - } else if (m_bat.is_simple()) { - IndexType t = ixType(); - IntVect cr = crseRatio(); - for (const int index : it->second) - { - const Box& ibox = amrex::convert(amrex::coarsen(abox[index],cr),t); - const Box& isect = bx & ibox; - - if (isect.ok()) - { - newbl.clear(); - for (const Box& b : bl) { - amrex::boxDiff(newdiff, b, isect); - newbl.join(newdiff); - } - bl.swap(newbl); - } + } + } + }); + } else if (m_bat.is_simple()) { + IndexType t = ixType(); + IntVect cr = crseRatio(); + AMREX_LOOP_3D(cbx, i, j, k, + { + auto it = BoxHashMap.find(IntVect(AMREX_D_DECL(i,j,k))); + if (it != TheEnd) { + for (const int index : it->second) { + const Box& ibox = amrex::convert(amrex::coarsen(abox[index],cr),t); + if (bx.intersects(ibox)) { + intersect_boxes.push_back(ibox); } - } else { - for (const int index : it->second) - { - const Box& ibox = m_bat.m_op.m_bndryReg(abox[index]); - const Box& isect = bx & ibox; - - if (isect.ok()) - { - newbl.clear(); - for (const Box& b : bl) { - amrex::boxDiff(newdiff, b, isect); - newbl.join(newdiff); - } - bl.swap(newbl); - } + } + } + }); + } else { + AMREX_LOOP_3D(cbx, i, j, k, + { + auto it = BoxHashMap.find(IntVect(AMREX_D_DECL(i,j,k))); + if (it != TheEnd) { + for (const int index : it->second) { + const Box& ibox = m_bat.m_op.m_bndryReg(abox[index]); + if (bx.intersects(ibox)) { + intersect_boxes.push_back(ibox); } } } + }); + } + + BoxList newbl(bl.ixType()); + BoxList newdiff(bl.ixType()); + for (auto const& ibox : intersect_boxes) { + newbl.clear(); + for (Box const& b : bl) { + amrex::boxDiff(newdiff, b, ibox); + newbl.join(newdiff); } + bl.swap(newbl); + if (bl.isEmpty()) { return; } } } @@ -1553,6 +1556,24 @@ BoxArray::uniqify () } m_bat.set_coarsen_ratio(IntVect::TheUnitVector()); } + m_simplified_list.reset(); +} + +BoxList const& +BoxArray::simplified_list () const +{ + if (!m_simplified_list) { + BoxList bl = boxList(); + bl.ordered_simplify(); + m_simplified_list = std::make_shared(std::move(bl)); + } + return *m_simplified_list; +} + +BoxArray +BoxArray::simplified () const +{ + return BoxArray(simplified_list()).convert(ixType()); } std::ostream& diff --git a/Src/Base/AMReX_BoxDomain.cpp b/Src/Base/AMReX_BoxDomain.cpp index dc3a07a2f62..8c4a7c4a7d3 100644 --- a/Src/Base/AMReX_BoxDomain.cpp +++ b/Src/Base/AMReX_BoxDomain.cpp @@ -63,6 +63,7 @@ BoxDomain& BoxDomain::complementIn (const Box& b, const BoxDomain& bl) { + BL_PROFILE("BoxDomain::complementIn()"); 
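The BoxArray::complementIn rewrite above first collects every box that intersects bx (via the hash map) and then subtracts them one at a time from the running complement with amrex::boxDiff, bailing out as soon as the complement is empty. A minimal sketch of that subtraction loop, assuming the intersecting boxes have already been gathered (the helper function is illustrative, not AMReX API):

#include <AMReX_BoxList.H>
#include <vector>

amrex::BoxList complement_of (amrex::Box const& region,
                              std::vector<amrex::Box> const& intersect_boxes)
{
    amrex::BoxList bl(region.ixType());
    bl.push_back(region);
    amrex::BoxList newbl(region.ixType());
    amrex::BoxList newdiff(region.ixType());
    for (auto const& ibox : intersect_boxes) {
        newbl.clear();
        for (amrex::Box const& b : bl) {
            amrex::boxDiff(newdiff, b, ibox); // pieces of b not covered by ibox
            newbl.join(newdiff);
        }
        bl.swap(newbl);
        if (bl.isEmpty()) { break; } // region fully covered
    }
    return bl;
}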
BoxList::complementIn(b,bl); BL_ASSERT(ok()); return *this; diff --git a/Src/Base/AMReX_BoxList.H b/Src/Base/AMReX_BoxList.H index aa9612f3fdf..3513b5cae63 100644 --- a/Src/Base/AMReX_BoxList.H +++ b/Src/Base/AMReX_BoxList.H @@ -139,11 +139,13 @@ public: //! Remove empty Boxes from this BoxList. BoxList& removeEmpty(); - BoxList& complementIn (const Box& b, - const BoxList& bl); - BoxList& complementIn (const Box& b, - BoxList&& bl); + BoxList& complementIn (const Box& b, const BoxList& bl); + BoxList& complementIn (const Box& b, BoxList&& bl); BoxList& complementIn (const Box& b, const BoxArray& ba); + BoxList& parallelComplementIn (const Box& b, const BoxList& bl); + BoxList& parallelComplementIn (const Box& b, BoxList&& bl); + BoxList& parallelComplementIn (const Box& b, const BoxArray& ba); + //! Refine each Box in the BoxList by the ratio. BoxList& refine (int ratio); //! Refine each Box in the BoxList by the ratio. @@ -173,6 +175,8 @@ public: * is O(N-squared) while the other algorithm is O(N). */ int simplify (bool best = false); + //! Assuming the boxes are nicely ordered + int ordered_simplify (); //! Forces each Box in the BoxList to have sides of length <= chunk. BoxList& maxSize (int chunk); //! Forces each Box in the BoxList to have dimth side of length <= chunk[dim]. @@ -210,9 +214,11 @@ public: std::swap(btype, rhs.btype); } + void Bcast (); + private: //! Core simplify routine. - int simplify_doit (bool best); + int simplify_doit (int depth); //! The list of Boxes. Vector m_lbox; diff --git a/Src/Base/AMReX_BoxList.cpp b/Src/Base/AMReX_BoxList.cpp index 71b9da577c8..c70a0cfa8df 100644 --- a/Src/Base/AMReX_BoxList.cpp +++ b/Src/Base/AMReX_BoxList.cpp @@ -7,6 +7,7 @@ #include #include #include +#include #ifdef _OPENMP #include @@ -69,7 +70,7 @@ BoxList::clear () void BoxList::join (const BoxList& blist) { - BL_ASSERT(ixType() == blist.ixType()); + BL_ASSERT(blist.size() == 0 || ixType() == blist.ixType()); m_lbox.insert(std::end(m_lbox), std::begin(blist), std::end(blist)); } @@ -83,7 +84,7 @@ BoxList::join (const Vector& barr) void BoxList::catenate (BoxList& blist) { - BL_ASSERT(ixType() == blist.ixType()); + BL_ASSERT(blist.size() == 0 || ixType() == blist.ixType()); m_lbox.insert(std::end(m_lbox), std::begin(blist), std::end(blist)); blist.m_lbox.clear(); } @@ -98,8 +99,7 @@ BoxList::removeEmpty() } BoxList -intersect (const BoxList& bl, - const Box& b) +intersect (const BoxList& bl, const Box& b) { BL_ASSERT(bl.ixType() == b.ixType()); BoxList newbl(bl); @@ -108,8 +108,7 @@ intersect (const BoxList& bl, } BoxList -refine (const BoxList& bl, - int ratio) +refine (const BoxList& bl, int ratio) { BoxList nbl(bl); nbl.refine(ratio); @@ -117,8 +116,7 @@ refine (const BoxList& bl, } BoxList -coarsen (const BoxList& bl, - int ratio) +coarsen (const BoxList& bl, int ratio) { BoxList nbl(bl); nbl.coarsen(ratio); @@ -126,8 +124,7 @@ coarsen (const BoxList& bl, } BoxList -accrete (const BoxList& bl, - int sz) +accrete (const BoxList& bl, int sz) { BoxList nbl(bl); nbl.accrete(sz); @@ -303,8 +300,7 @@ BoxList::intersect (const BoxList& bl) } BoxList -complementIn (const Box& b, - const BoxList& bl) +complementIn (const Box& b, const BoxList& bl) { BL_ASSERT(bl.ixType() == b.ixType()); BoxList newb(b.ixType()); @@ -313,16 +309,14 @@ complementIn (const Box& b, } BoxList& -BoxList::complementIn (const Box& b, - const BoxList& bl) +BoxList::complementIn (const Box& b, const BoxList& bl) { BoxArray ba(bl); return complementIn(b, ba); } BoxList& -BoxList::complementIn (const Box& b, - 
BoxList&& bl) +BoxList::complementIn (const Box& b, BoxList&& bl) { BoxArray ba(std::move(bl)); return complementIn(b, ba); @@ -406,6 +400,112 @@ BoxList::complementIn (const Box& b, const BoxArray& ba) return *this; } +BoxList& +BoxList::parallelComplementIn (const Box& b, const BoxList& bl) +{ + return parallelComplementIn(b, BoxArray(bl)); +} + +BoxList& +BoxList::parallelComplementIn (const Box& b, BoxList&& bl) +{ + return parallelComplementIn(b, BoxArray(std::move(bl))); +} + +BoxList& +BoxList::parallelComplementIn (const Box& b, BoxArray const& ba) +{ + BL_PROFILE("BoxList::parallelComplementIn()"); +#ifndef AMREX_USE_MPI + return complementIn(b,ba); +#else + if (ba.size() <= 8) + { + return complementIn(b,ba); + } + else + { + BL_PROFILE_VAR("BoxList::pci", boxlistpci); + + Long npts_avgbox; + Box mbox = ba.minimalBox(npts_avgbox); + *this = amrex::boxDiff(b, mbox); + auto mytyp = ixType(); + + BoxList bl_mesh(mbox & b); + +#if (AMREX_SPACEDIM == 1) + Real s_avgbox = npts_avgbox; +#elif (AMREX_SPACEDIM == 2) + Real s_avgbox = std::sqrt(npts_avgbox); +#elif (AMREX_SPACEDIM == 3) + Real s_avgbox = std::cbrt(npts_avgbox); +#endif + + const int block_size = 4 * std::max(1,static_cast(std::ceil(s_avgbox/4.))*4); + bl_mesh.maxSize(block_size); + const int N = bl_mesh.size(); + + const int nprocs = ParallelContext::NProcsSub(); + const int myproc = ParallelContext::MyProcSub(); + const int navg = N / nprocs; + const int nextra = N - navg*nprocs; + const int ilo = (myproc < nextra) ? myproc*(navg+1) : myproc*navg+nextra; + const int ihi = (myproc < nextra) ? ilo+navg+1-1 : ilo+navg-1; + + Vector local_boxes; + +#ifdef _OPENMP + bool start_omp_parallel = !omp_in_parallel(); + const int nthreads = omp_get_max_threads(); +#else + bool start_omp_parallel = false; +#endif + + if (start_omp_parallel) + { +#ifdef _OPENMP + Vector bl_priv(nthreads, BoxList(mytyp)); + int ntot = 0; +#pragma omp parallel reduction(+:ntot) + { + BoxList bl_tmp(mytyp); + auto& vbox = bl_priv[omp_get_thread_num()].m_lbox; +#pragma omp for + for (int i = ilo; i <= ihi; ++i) + { + ba.complementIn(bl_tmp, bl_mesh.m_lbox[i]); + vbox.insert(std::end(vbox), std::begin(bl_tmp), std::end(bl_tmp)); + } + ntot += bl_tmp.size(); + } + local_boxes.reserve(ntot); + for (auto& bl : bl_priv) { + local_boxes.insert(std::end(local_boxes), std::begin(bl), std::end(bl)); + } +#else + amrex::Abort("BoxList::complementIn: how did this happen"); +#endif + } + else + { + BoxList bl_tmp(mytyp); + for (int i = ilo; i <= ihi; ++i) + { + ba.complementIn(bl_tmp, bl_mesh.m_lbox[i]); + local_boxes.insert(std::end(local_boxes), std::begin(bl_tmp), std::end(bl_tmp)); + } + } + + amrex::AllGatherBoxes(local_boxes, this->size()); + local_boxes.insert(std::end(local_boxes), std::begin(m_lbox), std::end(m_lbox)); + std::swap(m_lbox, local_boxes); + + return *this; + } +#endif +} + BoxList& BoxList::refine (int ratio) { @@ -467,8 +567,7 @@ BoxList::accrete (const IntVect& sz) } BoxList& -BoxList::shift (int dir, - int nzones) +BoxList::shift (int dir, int nzones) { for (auto& bx : m_lbox) { @@ -478,8 +577,7 @@ BoxList::shift (int dir, } BoxList& -BoxList::shiftHalf (int dir, - int num_halfs) +BoxList::shiftHalf (int dir, int num_halfs) { for (auto& bx : m_lbox) { @@ -503,8 +601,7 @@ BoxList::shiftHalf (const IntVect& iv) // BoxList -boxDiff (const Box& b1in, - const Box& b2) +boxDiff (const Box& b1in, const Box& b2) { BL_ASSERT(b1in.sameType(b2)); BoxList bl_diff(b1in.ixType()); @@ -564,11 +661,28 @@ BoxList::simplify (bool best) 
std::sort(m_lbox.begin(), m_lbox.end(), [](const Box& l, const Box& r) { return l.smallEnd() < r.smallEnd(); }); - return simplify_doit(best); + // + // If we're not looking for the "best" we can do in one pass, we + // limit how far afield we look for abutting boxes. This greatly + // speeds up this routine for large numbers of boxes. It does not + // do quite as good a job though as full brute force. + // + int depth = best ? size() : 100; + return simplify_doit(depth); } int -BoxList::simplify_doit (bool best) +BoxList::ordered_simplify () +{ + int count; + for (int idim = 0; idim < AMREX_SPACEDIM; ++idim) { + count = simplify_doit(1); + } + return count; +} + +int +BoxList::simplify_doit (int depth) { // // Try to merge adjacent boxes. @@ -579,16 +693,9 @@ BoxList::simplify_doit (bool best) { const int* alo = bla->loVect(); const int* ahi = bla->hiVect(); - // - // If we're not looking for the "best" we can do in one pass, we - // limit how far afield we look for abutting boxes. This greatly - // speeds up this routine for large numbers of boxes. It does not - // do quite as good a job though as full brute force. - // - const int MaxCnt = (best ? size() : 100); iterator blb = bla + 1; - for (int cnt = 0; blb != End && cnt < MaxCnt; ++cnt, ++blb) + for (int cnt = 0; blb != End && cnt < depth; ++cnt, ++blb) { const int* blo = blb->loVect(); const int* bhi = blb->hiVect(); @@ -663,55 +770,55 @@ BoxList& BoxList::maxSize (const IntVect& chunk) { Vector new_boxes; - - for (int i = 0; i < AMREX_SPACEDIM; ++i) - { - new_boxes.clear(); - for (auto& bx : m_lbox) - { - const IntVect& boxlen = bx.size(); - const int* len = boxlen.getVect(); - - if (len[i] > chunk[i]) - { - // - // Reduce by powers of 2. - // - int ratio = 1; - int bs = chunk[i]; - int nlen = len[i]; - while ((bs%2 == 0) && (nlen%2 == 0)) - { - ratio *= 2; + for (auto const& bx : m_lbox) { + const IntVect boxlen = amrex::enclosedCells(bx).size(); + const IntVect boxlo = bx.smallEnd(); + IntVect ratio{1}, numblk{1}, extra{0}; + IntVect sz = boxlen; + for (int idim = 0; idim < AMREX_SPACEDIM; ++idim) { + if (boxlen[idim] > chunk[idim]) { + int bs = chunk[idim]; + int nlen = boxlen[idim]; + while ((bs%2 == 0) && (nlen%2 == 0)) { + ratio[idim] *= 2; bs /= 2; nlen /= 2; } - // - // Determine number and size of (coarsened) cuts. - // - const int numblk = nlen/bs + (nlen%bs ? 1 : 0); - const int sz = nlen/numblk; - const int extra = nlen%numblk; - // - // Number of cuts = number of blocks - 1. - // - for (int k = 0; k < numblk-1; k++) - { - // - // Compute size of this chunk, expand by power of 2. - // - const int ksize = (k < extra ? sz+1 : sz) * ratio; - // - // Chop from high end. - // - const int pos = bx.bigEnd(i) - ksize + 1; - - new_boxes.push_back(bx.chop(i,pos)); - } + numblk[idim] = (nlen+bs-1)/bs; + sz[idim] = nlen/numblk[idim]; + extra[idim] = nlen - sz[idim]*numblk[idim]; } } - join(new_boxes); + if (numblk == 1) { + new_boxes.push_back(bx); + } else { +#if (AMREX_SPACEDIM == 3) + for (int k = 0; k < numblk[2]; ++k) { + int klo = (k < extra[2]) ? k*(sz[2]+1)*ratio[2] : (k*sz[2]+extra[2])*ratio[2]; + int khi = (k < extra[2]) ? klo+(sz[2]+1)*ratio[2]-1 : klo+sz[2]*ratio[2]-1; + klo += boxlo[2]; + khi += boxlo[2]; +#endif +#if (AMREX_SPACEDIM >= 2) + for (int j = 0; j < numblk[1]; ++j) { + int jlo = (j < extra[1]) ? j*(sz[1]+1)*ratio[1] : (j*sz[1]+extra[1])*ratio[1]; + int jhi = (j < extra[1]) ? 
jlo+(sz[1]+1)*ratio[1]-1 : jlo+sz[1]*ratio[1]-1; + jlo += boxlo[1]; + jhi += boxlo[1]; +#endif + for (int i = 0; i < numblk[0]; ++i) { + int ilo = (i < extra[0]) ? i*(sz[0]+1)*ratio[0] : (i*sz[0]+extra[0])*ratio[0]; + int ihi = (i < extra[0]) ? ilo+(sz[0]+1)*ratio[0]-1 : ilo+sz[0]*ratio[0]-1; + ilo += boxlo[0]; + ihi += boxlo[0]; + new_boxes.push_back(Box(IntVect(AMREX_D_DECL(ilo,jlo,klo)), + IntVect(AMREX_D_DECL(ihi,jhi,khi))). + convert(ixType())); + AMREX_D_TERM(},},}) + } } + std::swap(new_boxes, m_lbox); + return *this; } @@ -773,8 +880,7 @@ BoxList::convert (IndexType typ) noexcept } std::ostream& -operator<< (std::ostream& os, - const BoxList& blist) +operator<< (std::ostream& os, const BoxList& blist) { BoxList::const_iterator bli = blist.begin(), End = blist.end(); os << "(BoxList " << blist.size() << ' ' << blist.ixType() << '\n'; @@ -802,4 +908,16 @@ BoxList::operator== (const BoxList& rhs) const return true; } +void +BoxList::Bcast () +{ + int nboxes = this->size(); + const int IOProcNumber = ParallelDescriptor::IOProcessorNumber(); + ParallelDescriptor::Bcast(&nboxes, 1, IOProcNumber); + if (ParallelDescriptor::MyProc() != IOProcNumber) { + m_lbox.resize(nboxes); + } + ParallelDescriptor::Bcast(m_lbox.data(), nboxes, IOProcNumber); +} + } diff --git a/Src/Base/AMReX_CArena.H b/Src/Base/AMReX_CArena.H index 211cb97d6ab..05bbe19b488 100644 --- a/Src/Base/AMReX_CArena.H +++ b/Src/Base/AMReX_CArena.H @@ -59,7 +59,7 @@ public: void PrintUsage (std::string const& name) const; //! The default memory hunk size to grab from the heap. - enum { DefaultHunkSize = 1024*1024*8 }; + constexpr static std::size_t DefaultHunkSize = 1024*1024*8; protected: //! The nodes in our free list and block list. diff --git a/Src/Base/AMReX_CArena.cpp b/Src/Base/AMReX_CArena.cpp index ce3e1bca307..f6bde9c0a62 100644 --- a/Src/Base/AMReX_CArena.cpp +++ b/Src/Base/AMReX_CArena.cpp @@ -121,8 +121,10 @@ CArena::free (void* vp) // `vp' had better be in the busy list. // auto busy_it = m_busylist.find(Node(vp,0,0)); - - BL_ASSERT(!(busy_it == m_busylist.end())); + if (busy_it == m_busylist.end()) { + amrex::Abort("CArena::free: unknown pointer"); + return; + } BL_ASSERT(m_freelist.find(*busy_it) == m_freelist.end()); m_actually_used -= busy_it->size(); diff --git a/Src/Base/AMReX_CoordSys.H b/Src/Base/AMReX_CoordSys.H index e62262e9a00..647600de9d1 100644 --- a/Src/Base/AMReX_CoordSys.H +++ b/Src/Base/AMReX_CoordSys.H @@ -82,7 +82,7 @@ public: GpuArray CellSizeArray () const noexcept { BL_ASSERT(ok); - return { AMREX_D_DECL(dx[0],dx[1],dx[2]) }; + return {{ AMREX_D_DECL(dx[0],dx[1],dx[2]) }}; } //! Returns the inverse cellsize for each coordinate direction. @@ -93,7 +93,7 @@ public: GpuArray InvCellSizeArray () const noexcept { BL_ASSERT(ok); - return { AMREX_D_DECL(inv_dx[0],inv_dx[1],inv_dx[2]) }; + return {{ AMREX_D_DECL(inv_dx[0],inv_dx[1],inv_dx[2]) }}; } //! Returns location of cell center in specified direction. 
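To make the arithmetic in the BoxList::maxSize rewrite above concrete: per dimension it factors out the largest power of two common to the chunk size and the box length (ratio), splits the reduced length into numblk near-equal pieces, and gives the first `extra` pieces one additional coarsened cell. A small standalone sketch with the same formulas (hypothetical helper, not AMReX API):

#include <cstdio>

void chunk_lengths (int nlen, int chunk)
{
    int ratio = 1, bs = chunk;
    while ((bs % 2 == 0) && (nlen % 2 == 0)) {
        ratio *= 2; bs /= 2; nlen /= 2;
    }
    int numblk = (nlen + bs - 1) / bs;  // ceil(nlen/bs)
    int sz     = nlen / numblk;
    int extra  = nlen - sz*numblk;
    for (int k = 0; k < numblk; ++k) {
        // the first `extra` chunks are one coarsened cell longer
        std::printf("chunk %d: %d cells\n", k, ((k < extra) ? sz+1 : sz) * ratio);
    }
}

For nlen = 96 and chunk = 32 this gives ratio = 32, numblk = 3, and three chunks of 32 cells, which is what the nested loops in maxSize produce.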
diff --git a/Src/Base/AMReX_CoordSys.cpp b/Src/Base/AMReX_CoordSys.cpp
index fd1529942f1..7d748960560 100644
--- a/Src/Base/AMReX_CoordSys.cpp
+++ b/Src/Base/AMReX_CoordSys.cpp
@@ -206,7 +206,7 @@ CoordSys::SetVolume (FArrayBox& a_volfab,
     AMREX_ASSERT(region.cellCentered());

     auto vol = a_volfab.array();
-    GpuArray<Real,AMREX_SPACEDIM> a_dx{AMREX_D_DECL(dx[0], dx[1], dx[2])};
+    GpuArray<Real,AMREX_SPACEDIM> a_dx{{AMREX_D_DECL(dx[0], dx[1], dx[2])}};

 #if (AMREX_SPACEDIM == 3)
     AMREX_ASSERT(IsCartesian());
@@ -216,7 +216,7 @@ CoordSys::SetVolume (FArrayBox& a_volfab,
         vol(i,j,k) = dv;
     });
 #else
-    GpuArray<Real,AMREX_SPACEDIM> a_offset{AMREX_D_DECL(offset[0],offset[1],offset[2])};
+    GpuArray<Real,AMREX_SPACEDIM> a_offset{{AMREX_D_DECL(offset[0],offset[1],offset[2])}};
     int coord = (int) c_sys;
     AMREX_LAUNCH_HOST_DEVICE_LAMBDA ( region, tbx,
     {
@@ -239,6 +239,8 @@ CoordSys::SetDLogA (FArrayBox& a_dlogafab,
                     const Box& region,
                     int dir) const
 {
+    amrex::ignore_unused(dir);
+
     AMREX_ASSERT(ok);
     AMREX_ASSERT(region.cellCentered());

@@ -491,6 +493,7 @@ CoordSys::Volume (const Real xlo[AMREX_SPACEDIM],
 Real
 CoordSys::AreaLo (const IntVect& point, int dir) const noexcept
 {
+    amrex::ignore_unused(point,dir);
 #if (AMREX_SPACEDIM==2)
     Real xlo[AMREX_SPACEDIM];
     switch (c_sys)
@@ -501,6 +504,7 @@ CoordSys::AreaLo (const IntVect& point, int dir) const noexcept
         case 0: return dx[1];
         case 1: return dx[0];
         }
+        return 0.; // to silence compiler warning
     case RZ:
         LoNode(point,xlo);
         switch (dir)
@@ -508,6 +512,7 @@ CoordSys::AreaLo (const IntVect& point, int dir) const noexcept
         {
         case 0: return TWOPI*dx[1]*xlo[0];
         case 1: return ((xlo[0]+dx[0])*(xlo[0]+dx[0])-xlo[0]*xlo[0])*(0.5*TWOPI);
         }
+        return 0.; // to silence compiler warning
     default:
         AMREX_ASSERT(0);
     }
@@ -526,6 +531,7 @@ CoordSys::AreaLo (const IntVect& point, int dir) const noexcept
 Real
 CoordSys::AreaHi (const IntVect& point, int dir) const noexcept
 {
+    amrex::ignore_unused(point,dir);
 #if (AMREX_SPACEDIM==2)
     Real xhi[AMREX_SPACEDIM];
     switch (c_sys)
@@ -536,6 +542,7 @@ CoordSys::AreaHi (const IntVect& point, int dir) const noexcept
         case 0: return dx[1];
         case 1: return dx[0];
         }
+        return 0.; // to silence compiler warning
     case RZ:
         HiNode(point,xhi);
         switch (dir)
@@ -543,6 +550,7 @@ CoordSys::AreaHi (const IntVect& point, int dir) const noexcept
         {
         case 0: return TWOPI*dx[1]*xhi[0];
         case 1: return (xhi[0]*xhi[0]-(xhi[0]-dx[0])*(xhi[0]-dx[0]))*(TWOPI*0.5);
         }
+        return 0.; // to silence compiler warning
     default:
         AMREX_ASSERT(0);
     }
diff --git a/Src/Base/AMReX_Dim3.H b/Src/Base/AMReX_Dim3.H
index 3a79ca3a59c..f8205b14189 100644
--- a/Src/Base/AMReX_Dim3.H
+++ b/Src/Base/AMReX_Dim3.H
@@ -7,31 +7,8 @@

 namespace amrex {

-#ifdef AMREX_USE_HIP
-struct Dim3 { int x; int y; int z;
-    AMREX_GPU_HOST_DEVICE
-    constexpr Dim3 () : x(0), y(0), z(0) {}
-    AMREX_GPU_HOST_DEVICE
-    constexpr Dim3 (int x_, int y_, int z_) // xxxxx HIP: todo
-        : x(x_), y(y_), z(z_) {}
-    AMREX_GPU_HOST_DEVICE
-    constexpr Dim3 (Dim3 const& rhs)
-        : x(rhs.x), y(rhs.y), z(rhs.z) {}
-};
-struct XDim3 { Real x; Real y; Real z;
-    AMREX_GPU_HOST_DEVICE
-    constexpr XDim3 () : x(0._rt), y(0._rt), z(0._rt) {}
-    AMREX_GPU_HOST_DEVICE
-    constexpr XDim3 (Real x_, Real y_, Real z_) // xxxxx HIP: todo
-        : x(x_), y(y_), z(z_) {}
-    AMREX_GPU_HOST_DEVICE
-    constexpr XDim3 (XDim3 const& rhs)
-        : x(rhs.x), y(rhs.y), z(rhs.z) {}
-};
-#else
 struct Dim3 { int x; int y; int z; };
 struct XDim3 { Real x; Real y; Real z; };
-#endif

 inline std::ostream& operator<< (std::ostream& os, const Dim3& d) {
     os << '(' << d.x << ',' << d.y << ',' << d.z << ')';
diff --git a/Src/Base/AMReX_DistributionMapping.H
b/Src/Base/AMReX_DistributionMapping.H index e0982d7b303..9b4d2722353 100644 --- a/Src/Base/AMReX_DistributionMapping.H +++ b/Src/Base/AMReX_DistributionMapping.H @@ -236,7 +236,9 @@ class DistributionMapping * if use_box_vol is true, weight boxes by their volume in Distribute * otherwise, all boxes will be treated with equal weight */ - static std::vector > makeSFC (const BoxArray& ba, bool use_box_vol=true); + static std::vector > makeSFC (const BoxArray& ba, + bool use_box_vol=true, + const int nprocs=ParallelContext::NProcsSub() ); /** \brief Computes the average cost per MPI rank given a distribution mapping * global cost vector. diff --git a/Src/Base/AMReX_DistributionMapping.cpp b/Src/Base/AMReX_DistributionMapping.cpp index 7447a750039..b268226511e 100644 --- a/Src/Base/AMReX_DistributionMapping.cpp +++ b/Src/Base/AMReX_DistributionMapping.cpp @@ -294,6 +294,7 @@ DistributionMapping::LeastUsedTeams (Vector & rteam, rteam.push_back(0); rworker.clear(); rworker.push_back(Vector(1,0)); + amrex::ignore_unused(nteams,nworkers); #endif } @@ -856,7 +857,8 @@ DistributionMapping::KnapSackProcessorMap (const BoxArray& boxes, int nprocs) { BL_ASSERT(boxes.size() > 0); - BL_ASSERT(m_ref->m_pmap.size() == boxes.size()); + + m_ref->m_pmap.resize(boxes.size()); if (boxes.size() <= nprocs || nprocs < 2) { @@ -882,53 +884,161 @@ namespace class Compare { public: + AMREX_FORCE_INLINE bool operator () (const SFCToken& lhs, const SFCToken& rhs) const; }; - - SFCToken (int box, const IntVect& idx, Real vol) - : - m_box(box), m_idx(idx), m_vol(vol) {} - - int m_box; - IntVect m_idx; - Real m_vol; - - static int MaxPower; + int m_box; + Array m_morton; }; } -int SFCToken::MaxPower = 64; - +AMREX_FORCE_INLINE bool SFCToken::Compare::operator () (const SFCToken& lhs, const SFCToken& rhs) const { - for (int i = SFCToken::MaxPower - 1; i >= 0; --i) +#if (AMREX_SPACEDIM == 1) + return lhs.m_morton[0] < rhs.m_morton[0]; +#elif (AMREX_SPACEDIM == 2) + return (lhs.m_morton[1] < rhs.m_morton[1]) || + ((lhs.m_morton[1] == rhs.m_morton[1]) && + (lhs.m_morton[0] < rhs.m_morton[0])); +#else + return (lhs.m_morton[2] < rhs.m_morton[2]) || + ((lhs.m_morton[2] == rhs.m_morton[2]) && + ((lhs.m_morton[1] < rhs.m_morton[1]) || + ((lhs.m_morton[1] == rhs.m_morton[1]) && + (lhs.m_morton[0] < rhs.m_morton[0])))); +#endif +} + +namespace { +#if (AMREX_SPACEDIM == 3) + AMREX_FORCE_INLINE + uint32_t make_space (uint32_t x) + { + // x : 0000,0000,0000,0000,0000,00a9,8765,4321 + x = (x | (x << 16)) & 0x030000FF; + // x << 16 : 0000,00a9,8765,4321,0000,0000,0000,0000 + // x | (x << 16): 0000,00a9,8765,4321,0000,00a9,8765,4321 + // 0x030000FF : 0000,0011,0000,0000,0000,0000,1111,1111 + // x : 0000,00a9,0000,0000,0000,0000,8765,4321 + x = (x | (x << 8)) & 0x0300F00F; + // x << 8 : 0000,0000,0000,0000,8765,4321,0000,0000 + // x | (x << 8) : 0000,00a9,0000,0000,8765,4321,8765,4321 + // 0x0300F00F : 0000,0011,0000,0000,1111,0000,0000,1111 + // x : 0000,00a9,0000,0000,8765,0000,0000,4321 + x = (x | (x << 4)) & 0x030C30C3; + // x << 4 : 00a9,0000,0000,8765,0000,0000,4321,0000 + // x | (x << 4) : 00a9,00a9,0000,8765,8765,0000,4321,4321 + // 0x030C30C3 : 0000,0011,0000,1100,0011,0000,1100,0011 + // x : 0000,00a9,0000,8700,0065,0000,4300,0021 + x = (x | (x << 2)) & 0x09249249; + // x << 2 : 0000,a900,0087,0000,6500,0043,0000,2100 + // x | (x << 2) : 0000,a9a9,0087,8700,6565,0043,4300,2121 + // 0x09249249 : 0000,1001,0010,0100,1001,0010,0100,1001 + // x : 0000,a009,0080,0700,6005,0040,0300,2001 + return x; + } +#elif (AMREX_SPACEDIM == 2) + 
AMREX_FORCE_INLINE
+    uint32_t make_space (uint32_t x)
+    {
-        const int N = (1<<i);
-        for (int j = AMREX_SPACEDIM-1; j >= 0; --j)
-        {
-            const int il = lhs.m_idx[j]/N;
-            const int ir = rhs.m_idx[j]/N;
+        // spread the low 16 bits of x so one zero bit separates
+        // consecutive input bits, making room to interleave y
+        x = (x | (x << 8)) & 0x00FF00FF;
+        x = (x | (x << 4)) & 0x0F0F0F0F;
+        x = (x | (x << 2)) & 0x33333333;
+        x = (x | (x << 1)) & 0x55555555;
+        return x;
+    }
+#endif
+
+    AMREX_FORCE_INLINE
+    SFCToken makeSFCToken (int box_index, IntVect const& iv)
+    {
+        SFCToken token;
+        token.m_box = box_index;
+
+#if (AMREX_SPACEDIM == 3)
+
+        constexpr int imin = -(1 << 29);
+        AMREX_ASSERT_WITH_MESSAGE(AMREX_D_TERM(iv[0] >= imin && iv[0] < -imin,
+                                            && iv[1] >= imin && iv[1] < -imin,
+                                            && iv[2] >= imin && iv[2] < -imin),
+                                  "SFCToken: index out of range");
+        uint32_t x = iv[0] - imin;
+        uint32_t y = iv[1] - imin;
+        uint32_t z = iv[2] - imin;
+        // extract lowest 10 bits and make space for interleaving
+        token.m_morton[0] = make_space(x & 0x3FF)
+                         | (make_space(y & 0x3FF) << 1)
+                         | (make_space(z & 0x3FF) << 2);
+        x = x >> 10;
+        y = y >> 10;
+        z = z >> 10;
+        token.m_morton[1] = make_space(x & 0x3FF)
+                         | (make_space(y & 0x3FF) << 1)
+                         | (make_space(z & 0x3FF) << 2);
+        x = x >> 10;
+        y = y >> 10;
+        z = z >> 10;
+        token.m_morton[2] = make_space(x & 0x3FF)
+                         | (make_space(y & 0x3FF) << 1)
+                         | (make_space(z & 0x3FF) << 2);
+
+#elif (AMREX_SPACEDIM == 2)
+
+        constexpr uint32_t offset = 1u << 31;
+        static_assert(static_cast<uint32_t>(std::numeric_limits<int>::max())+1 == offset,
+                      "INT_MAX != (1<<31)-1");
+        uint32_t x = (iv[0] >= 0) ? static_cast<uint32_t>(iv[0]) + offset
+            : static_cast<uint32_t>(iv[0]-std::numeric_limits<int>::lowest());
+        uint32_t y = (iv[1] >= 0) ? static_cast<uint32_t>(iv[1]) + offset
+            : static_cast<uint32_t>(iv[1]-std::numeric_limits<int>::lowest());
+        // extract lowest 16 bits and make space for interleaving
+        token.m_morton[0] = make_space(x & 0xFFFF)
+                         | (make_space(y & 0xFFFF) << 1);
+        x = x >> 16;
+        y = y >> 16;
+        token.m_morton[1] = make_space(x) | (make_space(y) << 1);
+
+#elif (AMREX_SPACEDIM == 1)
+
+        constexpr uint32_t offset = 1u << 31;
+        static_assert(static_cast<uint32_t>(std::numeric_limits<int>::max())+1 == offset,
+                      "INT_MAX != (1<<31)-1");
+        token.m_morton[0] = (iv[0] >= 0) ?
static_cast(iv[0]) + offset + : static_cast(iv[0]-std::numeric_limits::lowest()); - if (il < ir) - { - return true; - } - else if (il > ir) - { - return false; - } - } +#else + static_assert(false,"AMREX_SPACEDIM != 1, 2 or 3"); +#endif + + return token; } - return false; } static void Distribute (const std::vector& tokens, + const std::vector& wgts, int nprocs, Real volpercpu, std::vector< std::vector >& v) @@ -944,8 +1054,7 @@ Distribute (const std::vector& tokens, for (const auto &t : tokens) { Print() << " " << idx++ << ": " << t.m_box << ": " - << t.m_idx << ": " - << t.m_vol << std::endl; + << t.m_morton << std::endl; } } @@ -963,7 +1072,7 @@ Distribute (const std::vector& tokens, K < TSZ && (i == (nprocs-1) || (vol < volpercpu)); ++K) { - vol += tokens[K].m_vol; + vol += wgts[tokens[K].m_box]; ++cnt; v[i].push_back(tokens[K].m_box); @@ -977,7 +1086,7 @@ Distribute (const std::vector& tokens, { --K; v[i].pop_back(); - totalvol -= tokens[K].m_vol; + totalvol -= wgts[tokens[K].m_box]; } } @@ -993,9 +1102,8 @@ Distribute (const std::vector& tokens, BL_ASSERT(box == t.m_box); Print() << " " << idx << ": " << t.m_box << ": " - << t.m_idx << ": " - << t.m_vol << std::endl; - rank_vol += t.m_vol; + << t.m_morton << std::endl; + rank_vol += wgts[t.m_box]; idx++; } Print() << " Total Rank Vol: " << rank_vol << std::endl; @@ -1047,34 +1155,15 @@ DistributionMapping::SFCProcessorMapDoIt (const BoxArray& boxes, << nprocs << ", " << nteams << ", " << nworkers << ")\n"; } - std::vector tokens; - const int N = boxes.size(); - + std::vector tokens; tokens.reserve(N); - - int maxijk = 0; - for (int i = 0; i < N; ++i) { - const Box& bx = boxes[i]; - tokens.push_back(SFCToken(i,bx.smallEnd(),wgts[i])); - - const SFCToken& token = tokens.back(); - - AMREX_D_TERM(maxijk = std::max(maxijk, token.m_idx[0]);, - maxijk = std::max(maxijk, token.m_idx[1]);, - maxijk = std::max(maxijk, token.m_idx[2]);); + const Box& bx = boxes[i]; + tokens.push_back(makeSFCToken(i, bx.smallEnd())); } // - // Set SFCToken::MaxPower for BoxArray. - // - int m = 0; - for ( ; (1 << m) <= maxijk; ++m) { - ; // do nothing - } - SFCToken::MaxPower = m; - // // Put'm in Morton space filling curve order. // std::sort(tokens.begin(), tokens.end(), SFCToken::Compare()); @@ -1082,14 +1171,14 @@ DistributionMapping::SFCProcessorMapDoIt (const BoxArray& boxes, // Split'm up as equitably as possible per team. // Real volperteam = 0; - for (const SFCToken& tok : tokens) { - volperteam += tok.m_vol; + for (Long wt : wgts) { + volperteam += wt; } volperteam /= nteams; std::vector< std::vector > vec(nteams); - Distribute(tokens,nteams,volperteam,vec); + Distribute(tokens,wgts,nteams,volperteam,vec); // vec has a size of nteams and vec[] holds a vector of box ids. @@ -1311,33 +1400,14 @@ DistributionMapping::RRSFCDoIt (const BoxArray& boxes, amrex::Abort("Team support is not implemented yet in RRSFC"); #endif - std::vector tokens; - const int nboxes = boxes.size(); - + std::vector tokens; tokens.reserve(nboxes); - - int maxijk = 0; - for (int i = 0; i < nboxes; ++i) { - const Box& bx = boxes[i]; - tokens.push_back(SFCToken(i,bx.smallEnd(),0.0)); - - const SFCToken& token = tokens.back(); - - AMREX_D_TERM(maxijk = std::max(maxijk, token.m_idx[0]);, - maxijk = std::max(maxijk, token.m_idx[1]);, - maxijk = std::max(maxijk, token.m_idx[2]);); - } - // - // Set SFCToken::MaxPower for BoxArray. 
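The make_space/makeSFCToken code above builds a Morton (Z-order) key by spreading each coordinate's bits apart and interleaving them, and SFCToken::Compare then orders tokens by comparing the m_morton words from most to least significant. A tiny self-contained demonstration of the same 3D bit trick (a standalone sketch, not AMReX code):

#include <cstdint>
#include <cstdio>

// Same masks as the 3D make_space above: spread the low 10 bits of x
// so that two zero bits separate consecutive input bits.
std::uint32_t make_space (std::uint32_t x)
{
    x = (x | (x << 16)) & 0x030000FF;
    x = (x | (x <<  8)) & 0x0300F00F;
    x = (x | (x <<  4)) & 0x030C30C3;
    x = (x | (x <<  2)) & 0x09249249;
    return x;
}

int main ()
{
    // Interleave (x,y,z) = (3,1,2): key bits are ... z1 y1 x1 z0 y0 x0
    std::uint32_t key = make_space(3u) | (make_space(1u) << 1) | (make_space(2u) << 2);
    std::printf("morton(3,1,2) = %u\n", key); // prints 43 = 0b101011
    return 0;
}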
- // - int m = 0; - for ( ; (1 << m) <= maxijk; ++m) { - ; // do nothing + const Box& bx = boxes[i]; + tokens.push_back(makeSFCToken(i, bx.smallEnd())); } - SFCToken::MaxPower = m; // // Put'm in Morton space filling curve order. // @@ -1471,6 +1541,8 @@ DistributionMapping::makeKnapSack (const LayoutData& rcost_local, r = DistributionMapping(pmap); } } +#else + amrex::ignore_unused(broadcastToAll); #endif return r; @@ -1522,42 +1594,45 @@ DistributionMapping::ComputeDistributionMappingEfficiency (const DistributionMap *efficiency = (std::accumulate(rankToCost.begin(), rankToCost.end(), 0.0) / (nprocs*maxCost)); } - -DistributionMapping -DistributionMapping::makeKnapSack (const MultiFab& weight, int nmax) -{ - BL_PROFILE("makeKnapSack"); - - DistributionMapping r; - Vector cost(weight.size()); -#ifdef BL_USE_MPI - { - Vector rcost(cost.size(), 0.0); +namespace { +Vector +gather_weights (const MultiFab& weight) +{ +#ifdef AMREX_USE_MPI + LayoutData costld(weight.boxArray(),weight.DistributionMap()); #ifdef _OPENMP -#pragma omp parallel +#pragma omp parallel if (Gpu::notInLaunchRegion()) #endif - for (MFIter mfi(weight); mfi.isValid(); ++mfi) { - int i = mfi.index(); - rcost[i] = weight[mfi].sum(mfi.validbox(),0); - } - - ParallelAllReduce::Sum(&rcost[0], rcost.size(), ParallelContext::CommunicatorSub()); - - Real wmax = *std::max_element(rcost.begin(), rcost.end()); - Real scale = (wmax == 0) ? 1.e9 : 1.e9/wmax; - - for (int i = 0; i < rcost.size(); ++i) { - cost[i] = Long(rcost[i]*scale) + 1L; - } + for (MFIter mfi(weight); mfi.isValid(); ++mfi) { + costld[mfi] = weight[mfi].sum(mfi.validbox(),0); } + Vector rcost(weight.size()); + ParallelDescriptor::GatherLayoutDataToVector(costld, rcost, + ParallelContext::IOProcessorNumberSub()); + ParallelDescriptor::Bcast(rcost.data(), rcost.size(), ParallelContext::IOProcessorNumberSub()); + Real wmax = *std::max_element(rcost.begin(), rcost.end()); + Real scale = (wmax == 0) ? 1.e9 : 1.e9/wmax; + Vector lcost(rcost.size()); + for (int i = 0; i < rcost.size(); ++i) { + lcost[i] = static_cast(rcost[i]*scale) + 1L; + } + return lcost; +#else + return Vector(weight.size(), 1L); #endif +} +} +DistributionMapping +DistributionMapping::makeKnapSack (const MultiFab& weight, int nmax) +{ + BL_PROFILE("makeKnapSack"); + Vector cost = gather_weights(weight); int nprocs = ParallelContext::NProcsSub(); Real eff; - + DistributionMapping r; r.KnapSackProcessorMap(cost, nprocs, &eff, true, nmax); - return r; } @@ -1565,71 +1640,21 @@ DistributionMapping DistributionMapping::makeKnapSack (const MultiFab& weight, Real& eff, int nmax) { BL_PROFILE("makeKnapSack"); - - DistributionMapping r; - - Vector cost(weight.size()); -#ifdef BL_USE_MPI - { - Vector rcost(cost.size(), 0.0); -#ifdef _OPENMP -#pragma omp parallel -#endif - for (MFIter mfi(weight); mfi.isValid(); ++mfi) { - int i = mfi.index(); - rcost[i] = weight[mfi].sum(mfi.validbox(),0); - } - - ParallelAllReduce::Sum(&rcost[0], rcost.size(), ParallelContext::CommunicatorSub()); - - Real wmax = *std::max_element(rcost.begin(), rcost.end()); - Real scale = (wmax == 0) ? 
1.e9 : 1.e9/wmax; - - for (int i = 0; i < rcost.size(); ++i) { - cost[i] = Long(rcost[i]*scale) + 1L; - } - } -#endif - + Vector cost = gather_weights(weight); int nprocs = ParallelContext::NProcsSub(); - + DistributionMapping r; r.KnapSackProcessorMap(cost, nprocs, &eff, true, nmax); - return r; } DistributionMapping DistributionMapping::makeRoundRobin (const MultiFab& weight) { - DistributionMapping r; - - Vector cost(weight.size()); -#ifdef BL_USE_MPI - { - Vector rcost(cost.size(), 0.0); -#ifdef _OPENMP -#pragma omp parallel -#endif - for (MFIter mfi(weight); mfi.isValid(); ++mfi) { - int i = mfi.index(); - rcost[i] = weight[mfi].sum(mfi.validbox(),0); - } - - ParallelAllReduce::Sum(&rcost[0], rcost.size(), ParallelContext::CommunicatorSub()); - - Real wmax = *std::max_element(rcost.begin(), rcost.end()); - Real scale = (wmax == 0) ? 1.e9 : 1.e9/wmax; - - for (int i = 0; i < rcost.size(); ++i) { - cost[i] = Long(rcost[i]*scale) + 1L; - } - } -#endif - + BL_PROFILE("makeRoundRobin"); + Vector cost = gather_weights(weight); int nprocs = ParallelContext::NProcsSub(); - + DistributionMapping r; r.RoundRobinProcessorMap(cost, nprocs); - return r; } @@ -1637,36 +1662,10 @@ DistributionMapping DistributionMapping::makeSFC (const MultiFab& weight, bool sort) { BL_PROFILE("makeSFC"); - - DistributionMapping r; - - Vector cost(weight.size()); -#ifdef BL_USE_MPI - { - Vector rcost(cost.size(), 0.0); -#ifdef _OPENMP -#pragma omp parallel -#endif - for (MFIter mfi(weight); mfi.isValid(); ++mfi) { - int i = mfi.index(); - rcost[i] = weight[mfi].sum(mfi.validbox(),0); - } - - ParallelAllReduce::Sum(&rcost[0], rcost.size(), ParallelContext::CommunicatorSub()); - - Real wmax = *std::max_element(rcost.begin(), rcost.end()); - Real scale = (wmax == 0) ? 1.e9 : 1.e9/wmax; - - for (int i = 0; i < rcost.size(); ++i) { - cost[i] = Long(rcost[i]*scale) + 1L; - } - } -#endif - + Vector cost = gather_weights(weight); int nprocs = ParallelContext::NProcsSub(); - + DistributionMapping r; r.SFCProcessorMap(weight.boxArray(), cost, nprocs, sort); - return r; } @@ -1674,36 +1673,10 @@ DistributionMapping DistributionMapping::makeSFC (const MultiFab& weight, Real& eff, bool sort) { BL_PROFILE("makeSFC"); - - DistributionMapping r; - - Vector cost(weight.size()); -#ifdef BL_USE_MPI - { - Vector rcost(cost.size(), 0.0); -#ifdef _OPENMP -#pragma omp parallel -#endif - for (MFIter mfi(weight); mfi.isValid(); ++mfi) { - int i = mfi.index(); - rcost[i] = weight[mfi].sum(mfi.validbox(),0); - } - - ParallelAllReduce::Sum(&rcost[0], rcost.size(), ParallelContext::CommunicatorSub()); - - Real wmax = *std::max_element(rcost.begin(), rcost.end()); - Real scale = (wmax == 0) ? 
1.e9 : 1.e9/wmax; - - for (int i = 0; i < rcost.size(); ++i) { - cost[i] = Long(rcost[i]*scale) + 1L; - } - } -#endif - + Vector cost = gather_weights(weight); int nprocs = ParallelContext::NProcsSub(); - + DistributionMapping r; r.SFCProcessorMap(weight.boxArray(), cost, nprocs, eff, sort); - return r; } @@ -1812,57 +1785,43 @@ DistributionMapping::makeSFC (const LayoutData& rcost_local, r = DistributionMapping(pmap); } } +#else + amrex::ignore_unused(broadcastToAll); #endif return r; } std::vector > -DistributionMapping::makeSFC (const BoxArray& ba, bool use_box_vol) +DistributionMapping::makeSFC (const BoxArray& ba, bool use_box_vol, const int nprocs) { BL_PROFILE("makeSFC"); - std::vector tokens; - const int N = ba.size(); - + std::vector tokens; + std::vector wgts; tokens.reserve(N); - - int maxijk = 0; - - Real vol_sum = 0; + wgts.reserve(N); + Long vol_sum = 0; for (int i = 0; i < N; ++i) { - const Box& bx = ba[i]; - const auto & bx_vol = (use_box_vol ? bx.volume() : 1); - tokens.push_back(SFCToken(i,bx.smallEnd(),bx_vol)); - vol_sum += bx_vol; - - const SFCToken& token = tokens.back(); - - AMREX_D_TERM(maxijk = std::max(maxijk, token.m_idx[0]);, - maxijk = std::max(maxijk, token.m_idx[1]);, - maxijk = std::max(maxijk, token.m_idx[2]);); + const Box& bx = ba[i]; + tokens.push_back(makeSFCToken(i, bx.smallEnd())); + const Long v = use_box_vol ? bx.volume() : Long(1); + vol_sum += v; + wgts.push_back(v); } // - // Set SFCToken::MaxPower for BoxArray. - // - int m = 0; - for ( ; (1 << m) <= maxijk; ++m) { - ; // do nothing - } - SFCToken::MaxPower = m; - // // Put'm in Morton space filling curve order. // std::sort(tokens.begin(), tokens.end(), SFCToken::Compare()); - const int nprocs = ParallelContext::NProcsSub(); Real volper; volper = vol_sum / nprocs; std::vector< std::vector > r(nprocs); - Distribute(tokens, nprocs, volper, r); + + Distribute(tokens, wgts, nprocs, volper, r); return r; } diff --git a/Src/Base/AMReX_EArena.H b/Src/Base/AMReX_EArena.H index 315de02f87d..1321a98e063 100644 --- a/Src/Base/AMReX_EArena.H +++ b/Src/Base/AMReX_EArena.H @@ -41,7 +41,7 @@ public: std::size_t free_space_available () const noexcept; //! The default memory hunk size to grab from the heap. 
- enum { DefaultHunkSize = 1024*1024*8 }; + constexpr static std::size_t DefaultHunkSize = 1024*1024*8; protected: diff --git a/Src/Base/AMReX_Extension.H b/Src/Base/AMReX_Extension.H index dd7efaff2ca..b8bcf6e3c69 100644 --- a/Src/Base/AMReX_Extension.H +++ b/Src/Base/AMReX_Extension.H @@ -3,15 +3,6 @@ #if !defined(BL_LANG_FORT) -// HIP FIX HERE - noexcept - -#ifdef AMREX_HIP_PLATFORM_HCC -#define AMREX_NOEXCEPT -#else -#define AMREX_NOEXCEPT noexcept -#endif - - // restrict #ifdef __cplusplus @@ -126,15 +117,44 @@ #define AMREX_INLINE inline #endif +// no inline +#if defined(__GNUC__) || defined(__clang__) || defined(__CUDACC__) || defined(__HIP__) || defined(__SYCL_COMPILER_VERSION) +#define AMREX_NO_INLINE __attribute__((noinline)) +#else +#define AMREX_NO_INLINE +#endif // __attribute__((weak)) -#ifdef AMREX_TYPECHECK +#if defined(AMREX_TYPECHECK) #define AMREX_ATTRIBUTE_WEAK +#elif defined(_WIN32) +#define AMREX_ATTRIBUTE_WEAK #else #define AMREX_ATTRIBUTE_WEAK __attribute__((weak)) #endif +#if defined(__cplusplus) && defined(_WIN32) +#include +#endif + +#if (__cplusplus >= 201703L) +#define AMREX_FALLTHROUGH [[fallthrough]] +#elif defined(__clang__) +#define AMREX_FALLTHROUGH [[clang::fallthrough]] +#elif defined(__GNUC__) && (__GNUC__ >= 7) && !defined(__INTEL_COMPILER) +#define AMREX_FALLTHROUGH [[gnu::fallthrough]] +#else +#define AMREX_FALLTHROUGH ((void)0) +#endif + #endif /* !BL_LANG_FORT */ #endif + +/* + * DPCPP version strings + * beta08 #define __SYCL_COMPILER_VERSION 20200715 + * beta09 #define __SYCL_COMPILER_VERSION 20200827 + * beta10 #define __SYCL_COMPILER_VERSION 20201005 +*/ diff --git a/Src/Base/AMReX_FACopyDescriptor.H b/Src/Base/AMReX_FACopyDescriptor.H index 1dce8057044..e03697ed251 100644 --- a/Src/Base/AMReX_FACopyDescriptor.H +++ b/Src/Base/AMReX_FACopyDescriptor.H @@ -563,13 +563,13 @@ FabArrayCopyDescriptor::CollectData () // for meta-data Vector md_sender, md_offset, md_icnts, md_bcnts; - int* md_recv_data; + int* md_recv_data = nullptr; Vector md_send_data; Vector md_recv_reqs, md_send_reqs; // for data Vector data_sender, data_offset; - value_type* recv_data; + value_type* recv_data = nullptr; Vector send_data; Vector data_recv_reqs, data_send_reqs; diff --git a/Src/Base/AMReX_FArrayBox.cpp b/Src/Base/AMReX_FArrayBox.cpp index 9323c82710e..1ed44b082b0 100644 --- a/Src/Base/AMReX_FArrayBox.cpp +++ b/Src/Base/AMReX_FArrayBox.cpp @@ -527,7 +527,7 @@ FABio::read_header (std::istream& is, FABio* FABio::read_header (std::istream& is, FArrayBox& f, - int compIndex, + int /*compIndex*/, int& nCompAvailable) { // BL_PROFILE("FArrayBox::read_header_is_i"); @@ -718,9 +718,9 @@ FABio_ascii::skip (std::istream& is, } void -FABio_ascii::skip (std::istream& is, - FArrayBox& f, - int nCompToSkip) const +FABio_ascii::skip (std::istream& /*is*/, + FArrayBox& /*f*/, + int /*nCompToSkip*/) const { amrex::Error("FABio_ascii::skip(..., int nCompToSkip) not implemented"); } @@ -748,7 +748,7 @@ FABio_8bit::write (std::ostream& os, { BL_ASSERT(comp >= 0 && num_comp >= 1 && (comp+num_comp) <= f.nComp()); - const Real eps = 1.0e-8_rt; // FIXME - whats a better value? + const Real eps = 1.0e-8; // FIXME - what's a better value?
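The AMREX_FALLTHROUGH ladder added to AMReX_Extension.H above selects [[fallthrough]] under C++17, the clang/gnu attribute spellings on older compilers, and a no-op otherwise. A small usage sketch, with FALLTHROUGH as a stand-in for the real macro:

    // Deliberate case fallthrough, annotated so -Wimplicit-fallthrough
    // stays quiet where the attribute is supported.
    #if (__cplusplus >= 201703L)
    #define FALLTHROUGH [[fallthrough]]
    #else
    #define FALLTHROUGH ((void)0)
    #endif

    int stencil_width (int order)   // illustrative function, not AMReX API
    {
        switch (order) {
        case 4:
            FALLTHROUGH;            // fourth order shares the wide stencil
        case 3:
            return 2;
        default:
            return 1;
        }
    }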
const Long siz = f.box().numPts(); unsigned char *c = new unsigned char[siz]; diff --git a/Src/Base/AMReX_FBI.H b/Src/Base/AMReX_FBI.H index 6c294fbf68a..69a40df0a67 100644 --- a/Src/Base/AMReX_FBI.H +++ b/Src/Base/AMReX_FBI.H @@ -54,19 +54,26 @@ ParallelFor (Vector > const& tags, int ncomp, F && f) } nwarps.push_back(ntotwarps); - std::size_t nbytes = ntags*sizeof(TagType); - auto d_tags = static_cast(The_Device_Arena()->alloc(nbytes)); - Gpu::htod_memcpy(d_tags, tags.data(), nbytes); + std::size_t sizeof_tags = ntags*sizeof(TagType); + std::size_t offset_nwarps = Arena::align(sizeof_tags); + std::size_t sizeof_nwarps = (ntags+1)*sizeof(int); + std::size_t total_buf_size = offset_nwarps + sizeof_nwarps; - nbytes = (ntags+1)*sizeof(int); - auto d_nwarps = static_cast(The_Device_Arena()->alloc(nbytes)); - Gpu::htod_memcpy(d_nwarps, nwarps.data(), nbytes); + char* h_buffer = (char*)The_Pinned_Arena()->alloc(total_buf_size); + char* d_buffer = (char*)The_Arena()->alloc(total_buf_size); - constexpr int nthreads = 128; + std::memcpy(h_buffer, tags.data(), sizeof_tags); + std::memcpy(h_buffer+offset_nwarps, nwarps.data(), sizeof_nwarps); + Gpu::htod_memcpy_async(d_buffer, h_buffer, total_buf_size); + + auto d_tags = reinterpret_cast(d_buffer); + auto d_nwarps = reinterpret_cast(d_buffer+offset_nwarps); + + constexpr int nthreads = 256; constexpr int nwarps_per_block = nthreads/Gpu::Device::warp_size; int nblocks = (ntotwarps + nwarps_per_block-1) / nwarps_per_block; #ifdef AMREX_USE_DPCPP - amrex::launch(nblocks, nthreads, Gpu::nullStream(), + amrex::launch(nblocks, nthreads, Gpu::gpuStream(), [=] AMREX_GPU_DEVICE (sycl::nd_item<1> const& item) noexcept AMREX_REQUIRE_SUBGROUP_SIZE(Gpu::Device::warp_size) { @@ -112,14 +119,14 @@ ParallelFor (Vector > const& tags, int ncomp, F && f) } }); #else - amrex::launch(nblocks, nthreads, Gpu::nullStream(), + amrex::launch(nblocks, nthreads, Gpu::gpuStream(), [=] AMREX_GPU_DEVICE () noexcept { int g_tid = blockDim.x*blockIdx.x + threadIdx.x; int g_wid = g_tid / Gpu::Device::warp_size; if (g_wid >= ntotwarps) return; - int tag_id; + int tag_id = -10000; { int lo = 0; int hi = ntags; @@ -159,8 +166,8 @@ ParallelFor (Vector > const& tags, int ncomp, F && f) #endif Gpu::synchronize(); - The_Device_Arena()->free(d_nwarps); - The_Device_Arena()->free(d_tags); + The_Pinned_Arena()->free(h_buffer); + The_Arena()->free(d_buffer); } #endif @@ -196,7 +203,7 @@ struct CellAtomicAdd AMREX_GPU_DEVICE AMREX_FORCE_INLINE void operator() (U* d, U s) const noexcept { - Gpu::Atomic::Add(d,s); + Gpu::Atomic::AddNoRet(d,s); } }; @@ -221,19 +228,27 @@ fab_to_fab (Vector > const& copy_tags, int scomp, int dcomp, in } nwarps.push_back(ntotwarps); - std::size_t nbytes = N_locs*sizeof(TagType); - auto d_tags = static_cast(The_Device_Arena()->alloc(nbytes)); - Gpu::htod_memcpy(d_tags, copy_tags.data(), nbytes); + const int ntags = copy_tags.size(); + std::size_t sizeof_tags = ntags*sizeof(TagType); + std::size_t offset_nwarps = Arena::align(sizeof_tags); + std::size_t sizeof_nwarps = (ntags+1)*sizeof(int); + std::size_t total_buf_size = offset_nwarps + sizeof_nwarps; + + char* h_buffer = (char*)The_Pinned_Arena()->alloc(total_buf_size); + char* d_buffer = (char*)The_Arena()->alloc(total_buf_size); + + std::memcpy(h_buffer, copy_tags.data(), sizeof_tags); + std::memcpy(h_buffer+offset_nwarps, nwarps.data(), sizeof_nwarps); + Gpu::htod_memcpy_async(d_buffer, h_buffer, total_buf_size); - nbytes = (N_locs+1)*sizeof(int); - auto d_nwarps = static_cast(The_Device_Arena()->alloc(nbytes)); - 
Gpu::htod_memcpy(d_nwarps, nwarps.data(), nbytes); + auto d_tags = reinterpret_cast(d_buffer); + auto d_nwarps = reinterpret_cast(d_buffer+offset_nwarps); - constexpr int nthreads = 128; + constexpr int nthreads = 256; constexpr int nwarps_per_block = nthreads/Gpu::Device::warp_size; int nblocks = (ntotwarps + nwarps_per_block-1) / nwarps_per_block; #ifdef AMREX_USE_DPCPP - amrex::launch(nblocks, nthreads, Gpu::nullStream(), + amrex::launch(nblocks, nthreads, Gpu::gpuStream(), [=] AMREX_GPU_DEVICE (sycl::nd_item<1> const& item) noexcept AMREX_REQUIRE_SUBGROUP_SIZE(Gpu::Device::warp_size) { @@ -280,14 +295,14 @@ fab_to_fab (Vector > const& copy_tags, int scomp, int dcomp, in } }); #else - amrex::launch(nblocks, nthreads, Gpu::nullStream(), + amrex::launch(nblocks, nthreads, Gpu::gpuStream(), [=] AMREX_GPU_DEVICE () noexcept { int g_tid = blockDim.x*blockIdx.x + threadIdx.x; int g_wid = g_tid / Gpu::Device::warp_size; if (g_wid >= ntotwarps) return; - int tag_id; + int tag_id = -10000; { int lo = 0; int hi = N_locs; @@ -328,8 +343,8 @@ fab_to_fab (Vector > const& copy_tags, int scomp, int dcomp, in #endif Gpu::synchronize(); - The_Device_Arena()->free(d_nwarps); - The_Device_Arena()->free(d_tags); + The_Pinned_Arena()->free(h_buffer); + The_Arena()->free(d_buffer); } template @@ -353,30 +368,38 @@ fab_to_fab (Vector > const& copy_tags, int scomp, int dcomp, in } nwarps.push_back(ntotwarps); - std::size_t nbytes = N_locs*sizeof(TagType); - auto d_tags = static_cast(The_Device_Arena()->alloc(nbytes)); - Gpu::htod_memcpy(d_tags, copy_tags.data(), nbytes); + const int ntags = copy_tags.size(); + std::size_t sizeof_tags = ntags*sizeof(TagType); + std::size_t offset_nwarps = Arena::align(sizeof_tags); + std::size_t sizeof_nwarps = (ntags+1)*sizeof(int); + std::size_t offset_masks = Arena::align(offset_nwarps+sizeof_nwarps); + std::size_t sizeof_masks = masks.size()*sizeof(Array4); + std::size_t total_buf_size = offset_masks + sizeof_masks; + + char* h_buffer = (char*)The_Pinned_Arena()->alloc(total_buf_size); + char* d_buffer = (char*)The_Arena()->alloc(total_buf_size); - nbytes = (N_locs+1)*sizeof(int); - auto d_nwarps = static_cast(The_Device_Arena()->alloc(nbytes)); - Gpu::htod_memcpy(d_nwarps, nwarps.data(), nbytes); + std::memcpy(h_buffer, copy_tags.data(), sizeof_tags); + std::memcpy(h_buffer+offset_nwarps, nwarps.data(), sizeof_nwarps); + std::memcpy(h_buffer+offset_masks, masks.data(), sizeof_masks); + Gpu::htod_memcpy_async(d_buffer, h_buffer, total_buf_size); - nbytes = masks.size()*sizeof(Array4); - auto d_masks = static_cast*>(The_Device_Arena()->alloc(nbytes)); - Gpu::htod_memcpy(d_masks, masks.data(), nbytes); + auto d_tags = reinterpret_cast(d_buffer); + auto d_nwarps = reinterpret_cast(d_buffer+offset_nwarps); + auto d_masks = reinterpret_cast*>(d_buffer+offset_masks); - constexpr int nthreads = 128; + constexpr int nthreads = 256; constexpr int nwarps_per_block = nthreads/Gpu::Device::warp_size; int nblocks = (ntotwarps + nwarps_per_block-1) / nwarps_per_block; #ifdef AMREX_USE_DPCPP - amrex::launch(nblocks, nthreads, Gpu::nullStream(), + amrex::launch(nblocks, nthreads, Gpu::gpuStream(), [=] AMREX_GPU_DEVICE (sycl::nd_item<1> const& item) noexcept { int g_tid = item.get_global_id(0); int g_wid = g_tid / Gpu::Device::warp_size; if (g_wid >= ntotwarps) return; - int tag_id; + int tag_id = -1; { int lo = 0; int hi = N_locs; @@ -414,10 +437,18 @@ fab_to_fab (Vector > const& copy_tags, int scomp, int dcomp, in int to_try = 1; while (true) { int msk = (m && to_try) ? 
Gpu::Atomic::CAS(m, 0, mypriority) : 0; +#if (__SYCL_COMPILER_VERSION <= 20200827) if (sycl::intel::all_of(item.get_sub_group(), msk == 0)) { // 0 means lock acquired +#else + if (sycl::ONEAPI::all_of(item.get_sub_group(), msk == 0)) { // 0 means lock acquired +#endif break; // all threads have acquired. } else { +#if (__SYCL_COMPILER_VERSION <= 20200827) if (sycl::intel::any_of(item.get_sub_group(), msk > mypriority)) { +#else + if (sycl::ONEAPI::any_of(item.get_sub_group(), msk > mypriority)) { +#endif if (m) *m = 0; // yield item.mem_fence(); // xxxxx DPCPP todo: This is block level, but needs to be device level fence, which is currently a PR in intel/llvm to_try = 1; @@ -437,7 +468,7 @@ fab_to_fab (Vector > const& copy_tags, int scomp, int dcomp, in if (m) *m = 0; }); #else - amrex::launch(nblocks, nthreads, Gpu::nullStream(), + amrex::launch(nblocks, nthreads, Gpu::gpuStream(), [=] AMREX_GPU_DEVICE () noexcept { int g_tid = blockDim.x*blockIdx.x + threadIdx.x; @@ -515,9 +546,8 @@ fab_to_fab (Vector > const& copy_tags, int scomp, int dcomp, in #endif Gpu::synchronize(); - The_Device_Arena()->free(d_masks); - The_Device_Arena()->free(d_nwarps); - The_Device_Arena()->free(d_tags); + The_Pinned_Arena()->free(h_buffer); + The_Arena()->free(d_buffer); } template ::value,int> = 0> @@ -661,16 +691,18 @@ FabArray::FB_local_copy_gpu (const FB& TheFB, int scomp, int ncomp) } if (maskfabs.size() > 0) { + Gpu::FuseSafeGuard fsg(maskfabs.size() >= Gpu::getFuseNumKernelsThreshold()); for (Gpu::StreamIter sit(maskfabs.size()); sit.isValid(); ++sit) { BaseFab& mskfab = maskfabs[sit()]; const Array4& msk = mskfab.array(); const Box& bx = mskfab.box(); - amrex::ParallelFor(bx, + amrex::ParallelFor(Gpu::KernelInfo{}.setFusible(true), bx, [=] AMREX_GPU_DEVICE (int i, int j, int k) noexcept { msk(i,j,k) = 0; }); } + Gpu::LaunchFusedKernels(); } if (is_thread_safe) { @@ -923,7 +955,7 @@ FabArray::FB_pack_send_buffer_cuda_graph (const FB& TheFB, int scomp, int n // Is the conditional ever expected false? 
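The rewrites in AMReX_FBI.H above replace two or three separate device allocations and synchronous htod_memcpy calls with one pinned host buffer and one device buffer: each array is memcpy'd into the host buffer at an aligned offset and the whole thing moves with a single htod_memcpy_async. A host-only sketch of the layout arithmetic, where align_up stands in for Arena::align and malloc for The_Pinned_Arena()->alloc:

    #include <cstdlib>
    #include <cstring>
    #include <vector>

    // Round n up to a multiple of a (Arena::align is assumed to do the same
    // with the arena's fixed alignment; 128 bytes here is illustrative).
    constexpr std::size_t align_up (std::size_t n, std::size_t a = 128)
    {
        return ((n + a - 1) / a) * a;
    }

    struct TagType { int dst_index, src_index; }; // placeholder tag payload

    char* pack_tags (std::vector<TagType> const& tags,
                     std::vector<int> const& nwarps)
    {
        std::size_t sizeof_tags   = tags.size()*sizeof(TagType);
        std::size_t offset_nwarps = align_up(sizeof_tags);
        std::size_t total         = offset_nwarps + nwarps.size()*sizeof(int);
        char* h_buffer = static_cast<char*>(std::malloc(total));
        std::memcpy(h_buffer,               tags.data(),   sizeof_tags);
        std::memcpy(h_buffer+offset_nwarps, nwarps.data(), nwarps.size()*sizeof(int));
        // One Gpu::htod_memcpy_async(d_buffer, h_buffer, total) then replaces
        // the per-array synchronous copies; the kernel reads the tags at
        // offset 0 and the nwarps prefix sums at offset_nwarps.
        return h_buffer;
    }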
int launches = 0; for (int send = 0; send < N_snds; ++send) { - if (send_data[send] != nullptr) { + if (send_size[send] > 0) { launches += send_cctc[send]->size(); } } @@ -940,8 +972,7 @@ FabArray::FB_pack_send_buffer_cuda_graph (const FB& TheFB, int scomp, int n std::size_t(sizeof(CopyMemory)*launches) ); const int j = sit(); - char* dptr = send_data[j]; - if (dptr != nullptr) + if (send_size[j] > 0) { auto const& cctc = *send_cctc[j]; for (auto const& tag : cctc) @@ -971,9 +1002,9 @@ FabArray::FB_pack_send_buffer_cuda_graph (const FB& TheFB, int scomp, int n for (int send = 0; send < N_snds; ++send) { const int j = send; - char* dptr = send_data[j]; - if (dptr != nullptr) + if (send_size[j] > 0) { + char* dptr = send_data[j]; auto const& cctc = *send_cctc[j]; for (auto const& tag : cctc) { @@ -985,6 +1016,7 @@ FabArray::FB_pack_send_buffer_cuda_graph (const FB& TheFB, int scomp, int n dptr += (tag.sbox.numPts() * ncomp * sizeof(value_type)); } + amrex::ignore_unused(send_size); BL_ASSERT(dptr <= send_data[j] + send_size[j]); } } @@ -999,7 +1031,7 @@ FabArray::FB_unpack_recv_buffer_cuda_graph (const FB& TheFB, int dcomp, int Vector const& recv_data, Vector const& recv_size, Vector const& recv_cctc, - bool is_thread_safe) + bool /*is_thread_safe*/) { const int N_rcvs = recv_cctc.size(); if (N_rcvs == 0) return; @@ -1008,9 +1040,9 @@ FabArray::FB_unpack_recv_buffer_cuda_graph (const FB& TheFB, int dcomp, int LayoutData > recv_copy_tags(boxArray(),DistributionMap()); for (int k = 0; k < N_rcvs; ++k) { - const char* dptr = recv_data[k]; - if (dptr != nullptr) + if (recv_size[k] > 0) { + const char* dptr = recv_data[k]; auto const& cctc = *recv_cctc[k]; for (auto const& tag : cctc) { @@ -1018,6 +1050,7 @@ FabArray::FB_unpack_recv_buffer_cuda_graph (const FB& TheFB, int dcomp, int dptr += tag.dbox.numPts() * ncomp * sizeof(value_type); launches++; } + amrex::ignore_unused(recv_size); BL_ASSERT(dptr <= recv_data[k] + recv_size[k]); } } @@ -1080,23 +1113,35 @@ FabArray::FB_unpack_recv_buffer_cuda_graph (const FB& TheFB, int dcomp, int template void FabArray::pack_send_buffer_gpu (FabArray const& src, int scomp, int ncomp, - Vector& send_data, + Vector const& send_data, Vector const& send_size, Vector const& send_cctc) { + amrex::ignore_unused(send_size); + const int N_snds = send_data.size(); if (N_snds == 0) return; + char* pbuffer = send_data[0]; + std::size_t szbuffer = 0; +#if 0 + // For linear solver test on summit, this is slower than writing to + // pinned memory directly on device. + if (not ParallelDescriptor::UseGpuAwareMpi()) { + // Memory in send_data is pinned. 
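Inside the kernels above, each warp finds its work item with a binary search over nwarps, an exclusive prefix sum of warps-per-tag whose last entry is the total warp count. A standalone reconstruction of that lookup:

    // Returns the tag whose warp range contains g_wid, assuming
    // nwarps[0] == 0, nwarps[ntags] == total warps, and g_wid < nwarps[ntags].
    int find_tag (int g_wid, int const* nwarps, int ntags)
    {
        int lo = 0;
        int hi = ntags;
        while (lo+1 != hi) {   // invariant: nwarps[lo] <= g_wid < nwarps[hi]
            int mid = (lo+hi)/2;
            if (g_wid >= nwarps[mid]) { lo = mid; } else { hi = mid; }
        }
        return lo;
    }
    // Example: with nwarps = {0,2,7,9} and ntags = 3, find_tag(5, ...) == 1,
    // since warp 5 falls in tag 1's range [2,7).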
+ szbuffer = (send_data[N_snds-1]-send_data[0]) + send_size[N_snds-1]; + pbuffer = (char*)The_Arena()->alloc(szbuffer); + } +#endif + typedef Array4CopyTag TagType; Vector snd_copy_tags; - // FIX HIP HERE -- Dim3 - Dim3 zero; - zero.x = 0; zero.y = 0; zero.z = 0; for (int j = 0; j < N_snds; ++j) { - char* dptr = send_data[j]; - if (dptr != nullptr) + if (send_size[j] > 0) { + std::size_t offset = send_data[j]-send_data[0]; + char* dptr = pbuffer + offset; auto const& cctc = *send_cctc[j]; for (auto const& tag : cctc) { @@ -1104,16 +1149,24 @@ FabArray::pack_send_buffer_gpu (FabArray const& src, int scomp, int nc amrex::makeArray4((value_type*)(dptr), tag.sbox, ncomp), src.array(tag.srcIndex), tag.sbox, - zero + Dim3{0,0,0} }); dptr += (tag.sbox.numPts() * ncomp * sizeof(value_type)); } - BL_ASSERT(dptr <= send_data[j] + send_size[j]); + BL_ASSERT(dptr <= pbuffer + offset + send_size[j]); } } detail::fab_to_fab(snd_copy_tags, scomp, 0, ncomp, detail::CellStore()); + + // There is Gpu::synchronize in fab_to_fab. + + if (pbuffer != send_data[0]) { + Gpu::copyAsync(Gpu::deviceToHost,pbuffer,pbuffer+szbuffer,send_data[0]); + Gpu::synchronize(); + The_Arena()->free(pbuffer); + } } template @@ -1124,9 +1177,25 @@ FabArray::unpack_recv_buffer_gpu (FabArray& dst, int dcomp, int ncomp, Vector const& recv_cctc, CpOp op, bool is_thread_safe) { + amrex::ignore_unused(recv_size); + const int N_rcvs = recv_cctc.size(); if (N_rcvs == 0) return; + char* pbuffer = recv_data[0]; +#if 0 + std::size_t szbuffer = 0; + // For linear solver test on summit, this is slower than writing to + // pinned memory directly on device. + if (not ParallelDescriptor::UseGpuAwareMpi()) { + // Memory in recv_data is pinned. + szbuffer = (recv_data[N_rcvs-1]-recv_data[0]) + recv_size[N_rcvs-1]; + pbuffer = (char*)The_Arena()->alloc(szbuffer); + Gpu::copyAsync(Gpu::hostToDevice,recv_data[0],recv_data[0]+szbuffer,pbuffer); + Gpu::synchronize(); + } +#endif + typedef Array4CopyTag TagType; Vector recv_copy_tags; @@ -1143,9 +1212,10 @@ FabArray::unpack_recv_buffer_gpu (FabArray& dst, int dcomp, int ncomp, for (int k = 0; k < N_rcvs; ++k) { - const char* dptr = recv_data[k]; - if (dptr != nullptr) + if (recv_size[k] > 0) { + std::size_t offset = recv_data[k]-recv_data[0]; + const char* dptr = pbuffer + offset; auto const& cctc = *recv_cctc[k]; for (auto const& tag : cctc) { @@ -1165,21 +1235,23 @@ FabArray::unpack_recv_buffer_gpu (FabArray& dst, int dcomp, int ncomp, masks.push_back(maskfabs[li].array()); } } - BL_ASSERT(dptr <= recv_data[k] + recv_size[k]); + BL_ASSERT(dptr <= pbuffer + offset + recv_size[k]); } } if (maskfabs.size() > 0) { + Gpu::FuseSafeGuard fsg(maskfabs.size() >= Gpu::getFuseNumKernelsThreshold()); for (Gpu::StreamIter sit(maskfabs.size()); sit.isValid(); ++sit) { BaseFab& mskfab = maskfabs[sit()]; const Array4& msk = mskfab.array(); const Box& bx = mskfab.box(); - amrex::ParallelFor(bx, + amrex::ParallelFor(Gpu::KernelInfo().setFusible(true), bx, [=] AMREX_GPU_DEVICE (int i, int j, int k) noexcept { msk(i,j,k) = 0; }); } + Gpu::LaunchFusedKernels(); } if (op == FabArrayBase::COPY) @@ -1200,6 +1272,12 @@ FabArray::unpack_recv_buffer_gpu (FabArray& dst, int dcomp, int ncomp, detail::fab_to_fab_atomic_add(recv_copy_tags, 0, dcomp, ncomp, masks); } } + + // There is Gpu::synchronize in fab_to_fab. 
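pack_send_buffer_gpu and unpack_recv_buffer_gpu above keep an optional staging path (under #if 0, noted as slower in the Summit linear-solver test): when MPI is not GPU-aware, pack into one device buffer spanning the pinned send buffers, then copy back. Per-message pointers are recovered as offsets from the first buffer, which works because the whole send region is one contiguous allocation. A sketch of the offset arithmetic, with illustrative names and assuming a non-empty send_data (the real code returns early otherwise):

    #include <cstddef>
    #include <vector>

    struct Staging {
        char* pbuffer;        // where packing kernels write
        std::size_t szbuffer; // 0 when writing pinned memory directly
    };

    Staging make_staging (std::vector<char*> const& send_data,
                          std::vector<std::size_t> const& send_size,
                          bool gpu_aware_mpi)
    {
        Staging s{send_data[0], 0};
        if (!gpu_aware_mpi) {
            std::size_t n = send_data.size();
            // All buffers come from one allocation, so last start + last size
            // bounds the whole region.
            s.szbuffer = (send_data[n-1]-send_data[0]) + send_size[n-1];
            // s.pbuffer = device_alloc(s.szbuffer);  // The_Arena() in AMReX
        }
        return s;
    }

    // Message j is then packed at s.pbuffer + (send_data[j]-send_data[0]),
    // and, if staged, the region is copied back to send_data[0] afterwards.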
+ + if (pbuffer != recv_data[0]) { + The_Arena()->free(pbuffer); + } } #endif /* AMREX_USE_GPU */ @@ -1207,10 +1285,12 @@ FabArray::unpack_recv_buffer_gpu (FabArray& dst, int dcomp, int ncomp, template void FabArray::pack_send_buffer_cpu (FabArray const& src, int scomp, int ncomp, - Vector& send_data, + Vector const& send_data, Vector const& send_size, Vector const& send_cctc) { + amrex::ignore_unused(send_size); + const int N_snds = send_data.size(); if (N_snds == 0) return; @@ -1219,9 +1299,9 @@ FabArray::pack_send_buffer_cpu (FabArray const& src, int scomp, int nc #endif for (int j = 0; j < N_snds; ++j) { - char* dptr = send_data[j]; - if (dptr != nullptr) + if (send_size[j] > 0) { + char* dptr = send_data[j]; auto const& cctc = *send_cctc[j]; for (auto const& tag : cctc) { @@ -1248,6 +1328,8 @@ FabArray::unpack_recv_buffer_cpu (FabArray& dst, int dcomp, int ncomp, Vector const& recv_cctc, CpOp op, bool is_thread_safe) { + amrex::ignore_unused(recv_size); + const int N_rcvs = recv_cctc.size(); if (N_rcvs == 0) return; @@ -1258,9 +1340,9 @@ FabArray::unpack_recv_buffer_cpu (FabArray& dst, int dcomp, int ncomp, #endif for (int k = 0; k < N_rcvs; ++k) { - const char* dptr = recv_data[k]; - if (dptr != nullptr) + if (recv_size[k] > 0) { + const char* dptr = recv_data[k]; auto const& cctc = *recv_cctc[k]; for (auto const& tag : cctc) { @@ -1286,9 +1368,9 @@ FabArray::unpack_recv_buffer_cpu (FabArray& dst, int dcomp, int ncomp, recv_copy_tags.define(dst.boxArray(),dst.DistributionMap()); for (int k = 0; k < N_rcvs; ++k) { - const char* dptr = recv_data[k]; - if (dptr != nullptr) + if (recv_size[k] > 0) { + const char* dptr = recv_data[k]; auto const& cctc = *recv_cctc[k]; for (auto const& tag : cctc) { diff --git a/Src/Base/AMReX_FPC.cpp b/Src/Base/AMReX_FPC.cpp index 514120f29b7..97b6ee4637f 100644 --- a/Src/Base/AMReX_FPC.cpp +++ b/Src/Base/AMReX_FPC.cpp @@ -23,7 +23,8 @@ defined(__amd64__) || \ defined(__LITTLE_ENDIAN__) || \ defined(__powerpc__) || \ - defined(powerpc) + defined(powerpc) || \ + defined(_WIN32) #define AMREX_LITTLE_ENDIAN #endif diff --git a/Src/Base/AMReX_FabArray.H b/Src/Base/AMReX_FabArray.H index 7ce47fed648..db0b2073d2f 100644 --- a/Src/Base/AMReX_FabArray.H +++ b/Src/Base/AMReX_FabArray.H @@ -47,8 +47,8 @@ namespace amrex { -template ::value>::type > -Long nBytesOwned (T const& t) noexcept { return 0; } +template ::value,int>::type = 0> +Long nBytesOwned (T const&) noexcept { return 0; } template Long nBytesOwned (BaseFab const& fab) noexcept { return fab.nBytesOwned(); } @@ -136,26 +136,12 @@ struct MFInfo { } }; - template - class MFGraph; -#ifdef USE_PERILLA - class Perilla; -#endif - template class FabArray : public FabArrayBase { public: - friend class Action; - friend class AmrTask; - template - friend class MFGraph; -#ifdef USE_PERILLA - friend class Perilla; -#endif - struct FABType { typedef FAB value_type; @@ -270,7 +256,8 @@ public: /** * \brief Return true if the FabArray is well-defined. That is, - * if FABs are allocated for each Box in the BoxArray and the + * the FabArray has a BoxArray and DistributionMapping, the + * FABs are allocated for each Box in the BoxArray and the * sizes of the FABs and the number of components are consistent * with the definition of the FabArray. 
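The nBytesOwned change above and the long run of template churn that follows both switch from SFINAE via a defaulted type parameter (an unnamed typename std::enable_if<...>::type) to SFINAE via a defaulted non-type parameter (typename std::enable_if<...,int>::type = 0). The value form lets mutually exclusive overloads coexist without colliding as redeclarations, and sidesteps the nvcc quirks the old "// FOO fools nvcc" comments worked around. A minimal illustration with an assumed is_integral split:

    #include <string>
    #include <type_traits>

    // Two overloads that differ only in the enable_if condition: legal with
    // the value-parameter form, a redefinition error with the type-parameter
    // form (default arguments are not part of a template's signature).
    template <class T,
              typename std::enable_if<std::is_integral<T>::value,int>::type = 0>
    long bytes_owned (T const&) { return 0; }          // scalars own no storage

    template <class T,
              typename std::enable_if<!std::is_integral<T>::value,int>::type = 0>
    long bytes_owned (T const& t) { return static_cast<long>(t.size()); }

    // bytes_owned(3) == 0; bytes_owned(std::string("ab")) == 2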
*/ @@ -310,46 +297,46 @@ public: FAB * fabPtr (int K) noexcept; // Here K is global index FAB const* fabPtr (int K) const noexcept; - template ::value>::type > + template ::value,int>::type = 0> void prefetchToHost (const MFIter& mfi) const noexcept; - template ::value>::type > + template ::value,int>::type = 0> void prefetchToDevice (const MFIter& mfi) const noexcept; - template ::value>::type > + template ::value,int>::type = 0> Array4::value_type const> array (const MFIter& mfi) const noexcept; // - template ::value>::type > + template ::value,int>::type = 0> Array4::value_type> array (const MFIter& mfi) noexcept; // - template ::value>::type > + template ::value,int>::type = 0> Array4::value_type const> array (int K) const noexcept; // - template ::value>::type > + template ::value,int>::type = 0> Array4::value_type> array (int K) noexcept; - template ::value>::type > + template ::value,int>::type = 0> Array4::value_type const> const_array (const MFIter& mfi) const noexcept; // - template ::value>::type > + template ::value,int>::type = 0> Array4::value_type const> const_array (int K) const noexcept; - template ::value>::type > + template ::value,int>::type = 0> Array4::value_type const> array (const MFIter& mfi, int start_comp) const noexcept; // - template ::value>::type > + template ::value,int>::type = 0> Array4::value_type> array (const MFIter& mfi, int start_comp) noexcept; // - template ::value>::type > + template ::value,int>::type = 0> Array4::value_type const> array (int K, int start_comp) const noexcept; // - template ::value>::type > + template ::value,int>::type = 0> Array4::value_type> array (int K, int start_comp) noexcept; - template ::value>::type > + template ::value,int>::type = 0> Array4::value_type const> const_array (const MFIter& mfi, int start_comp) const noexcept; // - template ::value>::type > + template ::value,int>::type = 0> Array4::value_type const> const_array (int K, int start_comp) const noexcept; //! Explicitly set the Kth FAB in the FabArray to point to elem. @@ -362,11 +349,11 @@ public: void clear (); //! Set all components in the entire region of each FAB to val. - template ::value>::type > + template ::value,int>::type = 0> void setVal (value_type val); //! Set all components in the entire region of each FAB to val. - template ::value>::type > + template ::value,int>::type = 0> void operator= (value_type val); /** @@ -374,13 +361,13 @@ public: * each FAB in the FabArray, starting at component comp to val. * Also set the value of nghost boundary cells. */ - template ::value>::type > + template ::value,int>::type = 0> void setVal (value_type val, int comp, int num_comp, int nghost = 0); - template ::value>::type > + template ::value,int>::type = 0> void setVal (value_type val, int comp, int num_comp, @@ -392,14 +379,14 @@ public: * as nghost boundary cells, to val, provided they also intersect * with the Box region. */ - template ::value>::type > + template ::value,int>::type = 0> void setVal (value_type val, const Box& region, int comp, int num_comp, int nghost = 0); - template ::value>::type > + template ::value,int>::type = 0> void setVal (value_type val, const Box& region, int comp, @@ -409,10 +396,10 @@ public: * \brief Set all components in the valid region of each FAB in the * FabArray to val, including nghost boundary cells. 
*/ - template ::value>::type > + template ::value,int>::type = 0> void setVal (value_type val, int nghost); - template ::value>::type > + template ::value,int>::type = 0> void setVal (value_type val, const IntVect& nghost); /** @@ -420,50 +407,50 @@ public: * FabArray to val, including nghost boundary cells, that also * intersect the Box region. */ - template ::value>::type > + template ::value,int>::type = 0> void setVal (value_type val, const Box& region, int nghost); - template ::value>::type > + template ::value,int>::type = 0> void setVal (value_type val, const Box& region, const IntVect& nghost); - template ::value>::type > + template ::value,int>::type = 0> void abs (int comp, int num_comp, int nghost = 0); - template ::value>::type > + template ::value,int>::type = 0> void abs (int comp, int num_comp, const IntVect& nghost); - template ::value>::type > + template ::value,int>::type = 0> void plus (value_type val, int comp, int num_comp, int nghost = 0); - template ::value>::type > + template ::value,int>::type = 0> void plus (value_type val, const Box& region, int comp, int num_comp, int nghost = 0); - template ::value>::type > + template ::value,int>::type = 0> void mult (value_type val, int comp, int num_comp, int nghost = 0); - template ::value>::type > + template ::value,int>::type = 0> void mult (value_type val, const Box& region, int comp, int num_comp, int nghost = 0); - template ::value>::type > + template ::value,int>::type = 0> void invert (value_type numerator, int comp, int num_comp, int nghost = 0); - template ::value>::type > + template ::value,int>::type = 0> void invert (value_type numerator, const Box& region, int comp, int num_comp, int nghost = 0); //! Set all values in the boundary region to val. - template ::value>::type > + template ::value,int>::type = 0> void setBndry (value_type val); //! Set ncomp values in the boundary region, starting at start_comp to val. - template ::value>::type > + template ::value,int>::type = 0> void setBndry (value_type val, int strt_comp, int ncomp); //! Set all values outside the Geometry domain to val. - template ::value>::type > + template ::value,int>::type = 0> void setDomainBndry (value_type val, const Geometry& goem); //! Set ncomp values outside the Geometry domain to val, starting at start_comp. - template ::value>::type > + template ::value,int>::type = 0> void setDomainBndry (value_type val, int strt_comp, int ncomp, const Geometry& goem); /** @@ -653,7 +640,7 @@ public: void FillBoundary_nowait (int scomp, int ncomp, bool cross = false); void FillBoundary_nowait (int scomp, int ncomp, const Periodicity& period, bool cross = false); void FillBoundary_nowait (int scomp, int ncomp, const IntVect& nghost, const Periodicity& period, bool cross = false); - template ::value>::type > + template ::value,int>::type = 0> void FillBoundary_finish (); void FillBoundary_test (); @@ -673,14 +660,14 @@ public: // (including ghost cells outside periodic boundaries) // physbnd : boundary cells outside the domain (excluding periodic boundaries) // interior : interior cells (i.e., valid cells) - template ::value>::type > + template ::value,int>::type = 0> void BuildMask (const Box& phys_domain, const Periodicity& period, value_type covered, value_type notcovered, value_type physbnd, value_type interior); // The following are private functions. But we have to make them public for cuda. 
- template ::value>::type > + template ::value,int>::type = 0> void FBEP_nowait (int scomp, int ncomp, const IntVect& nghost, const Periodicity& period, bool cross, bool enforce_periodicity_only = false); @@ -689,10 +676,10 @@ public: void PC_local_cpu (const CPC& thecpc, FabArray const& src, int scomp, int dcomp, int ncomp, CpOp op); - template ::value>::type > + template ::value,int>::type = 0> void setVal (value_type x, const CommMetaData& thecmd, int scomp, int ncomp); - template ::value>::type > + template ::value,int>::type = 0> LayoutData RecvLayoutMask (const CommMetaData& thecmd); #ifdef AMREX_USE_GPU @@ -731,7 +718,7 @@ public: #endif static void pack_send_buffer_gpu (FabArray const& src, int scomp, int ncomp, - Vector& send_data, + Vector const& send_data, Vector const& send_size, Vector const& send_cctc); @@ -744,7 +731,7 @@ public: #endif static void pack_send_buffer_cpu (FabArray const& src, int scomp, int ncomp, - Vector& send_data, + Vector const& send_data, Vector const& send_size, Vector const& send_cctc); @@ -837,7 +824,6 @@ private: Vector& recv_size, Vector& recv_from, Vector& recv_reqs, - int icomp, int ncomp, int SeqNum); @@ -932,27 +918,31 @@ FabArray::fabPtr (int K) const noexcept } template -template +template ::value,int>::type> void FabArray::prefetchToHost (const MFIter& mfi) const noexcept { #ifdef AMREX_USE_CUDA this->fabPtr(mfi)->prefetchToHost(); +#else + amrex::ignore_unused(mfi); #endif } template -template +template ::value,int>::type> void FabArray::prefetchToDevice (const MFIter& mfi) const noexcept { #ifdef AMREX_USE_CUDA this->fabPtr(mfi)->prefetchToDevice(); +#else + amrex::ignore_unused(mfi); #endif } template -template +template ::value,int>::type> Array4::value_type const> FabArray::array (const MFIter& mfi) const noexcept { @@ -960,7 +950,7 @@ FabArray::array (const MFIter& mfi) const noexcept } template -template +template ::value,int>::type> Array4::value_type> FabArray::array (const MFIter& mfi) noexcept { @@ -968,7 +958,7 @@ FabArray::array (const MFIter& mfi) noexcept } template -template +template ::value,int>::type> Array4::value_type const> FabArray::array (int K) const noexcept { @@ -976,7 +966,7 @@ FabArray::array (int K) const noexcept } template -template +template ::value,int>::type> Array4::value_type> FabArray::array (int K) noexcept { @@ -984,7 +974,7 @@ FabArray::array (int K) noexcept } template -template +template ::value,int>::type> Array4::value_type const> FabArray::const_array (const MFIter& mfi) const noexcept { @@ -992,7 +982,7 @@ FabArray::const_array (const MFIter& mfi) const noexcept } template -template +template ::value,int>::type> Array4::value_type const> FabArray::const_array (int K) const noexcept { @@ -1000,7 +990,7 @@ FabArray::const_array (int K) const noexcept } template -template +template ::value,int>::type> Array4::value_type const> FabArray::array (const MFIter& mfi, int start_comp) const noexcept { @@ -1008,7 +998,7 @@ FabArray::array (const MFIter& mfi, int start_comp) const noexcept } template -template +template ::value,int>::type> Array4::value_type> FabArray::array (const MFIter& mfi, int start_comp) noexcept { @@ -1016,7 +1006,7 @@ FabArray::array (const MFIter& mfi, int start_comp) noexcept } template -template +template ::value,int>::type> Array4::value_type const> FabArray::array (int K, int start_comp) const noexcept { @@ -1024,7 +1014,7 @@ FabArray::array (int K, int start_comp) const noexcept } template -template +template ::value,int>::type> Array4::value_type> FabArray::array (int K, int 
start_comp) noexcept { @@ -1032,7 +1022,7 @@ FabArray::array (int K, int start_comp) noexcept } template -template +template ::value,int>::type> Array4::value_type const> FabArray::const_array (const MFIter& mfi, int start_comp) const noexcept { @@ -1040,7 +1030,7 @@ FabArray::const_array (const MFIter& mfi, int start_comp) const noexcept } template -template +template ::value,int>::type> Array4::value_type const> FabArray::const_array (int K, int start_comp) const noexcept { @@ -1078,7 +1068,7 @@ FabArray::clear () } template -template +template ::value,int>::type> void FabArray::setVal (value_type val, int nghost) { @@ -1086,7 +1076,7 @@ FabArray::setVal (value_type val, int nghost) } template -template +template ::value,int>::type> void FabArray::setVal (value_type val, const IntVect& nghost) { @@ -1094,7 +1084,7 @@ FabArray::setVal (value_type val, const IntVect& nghost) } template -template +template ::value,int>::type> void FabArray::setVal (value_type val, const Box& region, int nghost) { @@ -1102,7 +1092,7 @@ FabArray::setVal (value_type val, const Box& region, int nghost) } template -template +template ::value,int>::type> void FabArray::setVal (value_type val, const Box& region, const IntVect& nghost) { @@ -1214,6 +1204,8 @@ template bool FabArray::ok () const { + if (!define_function_called) return false; + int isok = 1; for (MFIter fai(*this); fai.isValid() && isok; ++fai) @@ -1448,7 +1440,7 @@ FabArray::setFab (const MFIter& mfi, } template -template +template ::value,int>::type> void FabArray::setBndry (value_type val) { @@ -1456,7 +1448,7 @@ FabArray::setBndry (value_type val) } template -template +template ::value,int>::type> void FabArray::setBndry (value_type val, int strt_comp, @@ -1475,7 +1467,7 @@ FabArray::setBndry (value_type val, } template -template +template ::value,int>::type> void FabArray::setDomainBndry (value_type val, const Geometry& geom) { @@ -1483,7 +1475,7 @@ FabArray::setDomainBndry (value_type val, const Geometry& geom) } template -template +template ::value,int>::type> void FabArray::setDomainBndry (value_type val, int strt_comp, @@ -1544,7 +1536,7 @@ FabArray::copyTo (FAB& dest, } template -template +template ::value,int>::type> void FabArray::setVal (value_type val) { @@ -1552,7 +1544,7 @@ FabArray::setVal (value_type val) } template -template +template ::value,int>::type> void FabArray::operator= (value_type val) { @@ -1560,7 +1552,7 @@ FabArray::operator= (value_type val) } template -template +template ::value,int>::type> void FabArray::setVal (value_type val, int comp, @@ -1571,7 +1563,7 @@ FabArray::setVal (value_type val, } template -template // FOO fools nvcc +template ::value,int>::type Z> void FabArray::setVal (value_type val, int comp, @@ -1590,7 +1582,7 @@ FabArray::setVal (value_type val, { const Box& bx = fai.growntilebox(nghost); auto fab = this->array(fai); - AMREX_HOST_DEVICE_PARALLEL_FOR_4D ( bx, ncomp, i, j, k, n, + AMREX_HOST_DEVICE_PARALLEL_FOR_4D_FUSIBLE ( bx, ncomp, i, j, k, n, { fab(i,j,k,n+comp) = val; }); @@ -1598,7 +1590,7 @@ FabArray::setVal (value_type val, } template -template +template ::value,int>::type> void FabArray::setVal (value_type val, const Box& region, @@ -1610,7 +1602,7 @@ FabArray::setVal (value_type val, } template -template // Foo fools nvcc +template ::value,int>::type Z> void FabArray::setVal (value_type val, const Box& region, @@ -1633,7 +1625,7 @@ FabArray::setVal (value_type val, if (b.ok()) { auto fab = this->array(fai); - AMREX_HOST_DEVICE_PARALLEL_FOR_4D ( b, ncomp, i, j, k, n, + 
AMREX_HOST_DEVICE_PARALLEL_FOR_4D_FUSIBLE ( b, ncomp, i, j, k, n, { fab(i,j,k,n+comp) = val; }); @@ -1642,7 +1634,7 @@ FabArray::setVal (value_type val, } template -template // FOO fools nvcc +template ::value,int>::type> void FabArray::abs (int comp, int ncomp, int nghost) { @@ -1650,7 +1642,7 @@ FabArray::abs (int comp, int ncomp, int nghost) } template -template // FOO fools nvcc +template ::value,int>::type Z> void FabArray::abs (int comp, int ncomp, const IntVect& nghost) { @@ -1663,7 +1655,7 @@ FabArray::abs (int comp, int ncomp, const IntVect& nghost) { const Box& bx = mfi.growntilebox(nghost); auto fab = this->array(mfi); - AMREX_HOST_DEVICE_PARALLEL_FOR_4D ( bx, ncomp, i, j, k, n, + AMREX_HOST_DEVICE_PARALLEL_FOR_4D_FUSIBLE ( bx, ncomp, i, j, k, n, { fab(i,j,k,n+comp) = amrex::Math::abs(fab(i,j,k,n+comp)); }); @@ -1671,7 +1663,7 @@ FabArray::abs (int comp, int ncomp, const IntVect& nghost) } template -template // FOO fools nvcc +template ::value,int>::type Z> void FabArray::plus (value_type val, int comp, int num_comp, int nghost) { @@ -1682,7 +1674,7 @@ FabArray::plus (value_type val, int comp, int num_comp, int nghost) { const Box& bx = mfi.growntilebox(nghost); auto fab = this->array(mfi); - AMREX_HOST_DEVICE_PARALLEL_FOR_4D ( bx, num_comp, i, j, k, n, + AMREX_HOST_DEVICE_PARALLEL_FOR_4D_FUSIBLE ( bx, num_comp, i, j, k, n, { fab(i,j,k,n+comp) += val; }); @@ -1690,7 +1682,7 @@ FabArray::plus (value_type val, int comp, int num_comp, int nghost) } template -template // FOO fools nvcc +template ::value,int>::type Z> void FabArray::plus (value_type val, const Box& region, int comp, int num_comp, int nghost) { @@ -1702,7 +1694,7 @@ FabArray::plus (value_type val, const Box& region, int comp, int num_comp, const Box& bx = mfi.growntilebox(nghost) & region; if (bx.ok()) { auto fab = this->array(mfi); - AMREX_HOST_DEVICE_PARALLEL_FOR_4D ( bx, num_comp, i, j, k, n, + AMREX_HOST_DEVICE_PARALLEL_FOR_4D_FUSIBLE ( bx, num_comp, i, j, k, n, { fab(i,j,k,n+comp) += val; }); @@ -1711,7 +1703,7 @@ FabArray::plus (value_type val, const Box& region, int comp, int num_comp, } template -template // FOO fools nvcc +template ::value,int>::type Z> void FabArray::mult (value_type val, int comp, int num_comp, int nghost) { @@ -1722,7 +1714,7 @@ FabArray::mult (value_type val, int comp, int num_comp, int nghost) { const Box& bx = mfi.growntilebox(nghost); auto fab = this->array(mfi); - AMREX_HOST_DEVICE_PARALLEL_FOR_4D ( bx, num_comp, i, j, k, n, + AMREX_HOST_DEVICE_PARALLEL_FOR_4D_FUSIBLE ( bx, num_comp, i, j, k, n, { fab(i,j,k,n+comp) *= val; }); @@ -1730,7 +1722,7 @@ FabArray::mult (value_type val, int comp, int num_comp, int nghost) } template -template // FOO fools nvcc +template ::value,int>::type Z> void FabArray::mult (value_type val, const Box& region, int comp, int num_comp, int nghost) { @@ -1742,7 +1734,7 @@ FabArray::mult (value_type val, const Box& region, int comp, int num_comp, const Box& bx = mfi.growntilebox(nghost) & region; if (bx.ok()) { auto fab = this->array(mfi); - AMREX_HOST_DEVICE_PARALLEL_FOR_4D ( bx, num_comp, i, j, k, n, + AMREX_HOST_DEVICE_PARALLEL_FOR_4D_FUSIBLE ( bx, num_comp, i, j, k, n, { fab(i,j,k,n+comp) *= val; }); @@ -1751,7 +1743,7 @@ FabArray::mult (value_type val, const Box& region, int comp, int num_comp, } template -template // FOO fools nvcc +template ::value,int>::type Z> void FabArray::invert (value_type numerator, int comp, int num_comp, int nghost) { @@ -1762,7 +1754,7 @@ FabArray::invert (value_type numerator, int comp, int num_comp, int nghost) { const Box& 
bx = mfi.growntilebox(nghost); auto fab = this->array(mfi); - AMREX_HOST_DEVICE_PARALLEL_FOR_4D ( bx, num_comp, i, j, k, n, + AMREX_HOST_DEVICE_PARALLEL_FOR_4D_FUSIBLE ( bx, num_comp, i, j, k, n, { fab(i,j,k,n+comp) = numerator / fab(i,j,k,n+comp); }); @@ -1770,7 +1762,7 @@ FabArray::invert (value_type numerator, int comp, int num_comp, int nghost) } template -template // FOO fools nvcc +template ::value,int>::type Z> void FabArray::invert (value_type numerator, const Box& region, int comp, int num_comp, int nghost) { @@ -1782,7 +1774,7 @@ FabArray::invert (value_type numerator, const Box& region, int comp, int nu const Box& bx = mfi.growntilebox(nghost) & region; if (bx.ok()) { auto fab = this->array(mfi); - AMREX_HOST_DEVICE_PARALLEL_FOR_4D ( bx, num_comp, i, j, k, n, + AMREX_HOST_DEVICE_PARALLEL_FOR_4D_FUSIBLE ( bx, num_comp, i, j, k, n, { fab(i,j,k,n+comp) = numerator / fab(i,j,k,n+comp); }); @@ -1953,7 +1945,7 @@ FabArray::FillBoundary_nowait (int scomp, int ncomp, const IntVect& nghost, } template -template +template ::value,int>::type Z> void FabArray::BuildMask (const Box& phys_domain, const Periodicity& period, value_type covered, value_type notcovered, @@ -1978,7 +1970,7 @@ FabArray::BuildMask (const Box& phys_domain, const Periodicity& period, Box const& fbx = mfi.growntilebox(); Box const& gbx = fbx & domain; Box const& vbx = mfi.validbox(); - AMREX_HOST_DEVICE_FOR_4D(fbx, ncomp, i, j, k, n, + AMREX_HOST_DEVICE_FOR_4D_FUSIBLE(fbx, ncomp, i, j, k, n, { IntVect iv(AMREX_D_DECL(i,j,k)); if (vbx.contains(iv)) { @@ -1996,15 +1988,15 @@ FabArray::BuildMask (const Box& phys_domain, const Periodicity& period, } template -template +template ::value,int>::type> void FabArray::setVal (value_type val, const CommMetaData& thecmd, int scomp, int ncomp) { #ifdef AMREX_USE_GPU if (Gpu::inLaunchRegion()) { - CMD_local_setVal_gpu(val, thecmd, 0, ncomp); - CMD_remote_setVal_gpu(val, thecmd, 0, ncomp); + CMD_local_setVal_gpu(val, thecmd, scomp, ncomp); + CMD_remote_setVal_gpu(val, thecmd, scomp, ncomp); } else #endif @@ -2017,7 +2009,7 @@ FabArray::setVal (value_type val, const CommMetaData& thecmd, int scomp, in #endif for (int i = 0; i < N_locs; ++i) { const CopyComTag& tag = LocTags[i]; - (*this)[tag.dstIndex].template setVal(val, tag.dbox, 0, ncomp); + (*this)[tag.dstIndex].template setVal(val, tag.dbox, scomp, ncomp); } for (auto it = RcvTags.begin(); it != RcvTags.end(); ++it) { @@ -2027,14 +2019,14 @@ FabArray::setVal (value_type val, const CommMetaData& thecmd, int scomp, in #endif for (int i = 0; i < N; ++i) { const CopyComTag& tag = it->second[i]; - (*this)[tag.dstIndex].template setVal(val, tag.dbox, 0, ncomp); + (*this)[tag.dstIndex].template setVal(val, tag.dbox, scomp, ncomp); } } } } template -template +template ::value,int>::type> LayoutData FabArray::RecvLayoutMask (const CommMetaData& thecmd) { diff --git a/Src/Base/AMReX_FabArrayBase.H b/Src/Base/AMReX_FabArrayBase.H index 002d2a3586f..631da49e938 100644 --- a/Src/Base/AMReX_FabArrayBase.H +++ b/Src/Base/AMReX_FabArrayBase.H @@ -23,11 +23,6 @@ class Geometry; class FArrayBox; template class FabFactory; template class FabArray; -class AmrTask; -#ifdef USE_PERILLA -class Perilla; -class RegionGraph; -#endif namespace EB2 { class IndexSpace; } @@ -35,11 +30,6 @@ class FabArrayBase { friend class MFIter; friend class MFGhostIter; - friend class AmrTask; -#ifdef USE_PERILLA - friend class Perilla; - friend class RegionGraph; -#endif template friend void FillBoundary (Vector*> const& mf, const Periodicity& period); @@ -143,6 +133,7 @@ 
public: */ bool is_cell_centered () const noexcept; + void setMultiGhost(bool a_multi_ghost) {m_multi_ghost = a_multi_ghost;} // These are provided for convenience to keep track of how many // ghost cells are up to date. The number of filled ghost cells @@ -324,6 +315,7 @@ public: const Box& dstdomain, const IntVect& dstng, const BoxConverter& coarsener, + const Box& fdomain, const Box& cdomain, const EB2::IndexSpace* index_space); @@ -332,16 +324,16 @@ public: Long bytes () const; BoxArray ba_crse_patch; - DistributionMapping dm_crse_patch; + BoxArray ba_fine_patch; + DistributionMapping dm_patch; std::unique_ptr > fact_crse_patch; - Vector dst_idxs; - Vector dst_boxes; + std::unique_ptr > fact_fine_patch; // BDKey m_srcbdk; BDKey m_dstbdk; Box m_dstdomain; IntVect m_dstng; - BoxConverter* m_coarsener; + std::unique_ptr m_coarsener; // Long m_nuse; }; @@ -355,10 +347,10 @@ public: static const FPinfo& TheFPinfo (const FabArrayBase& srcfa, const FabArrayBase& dstfa, - const Box& dstdomain, const IntVect& dstng, const BoxConverter& coarsener, - const Box& cdomain, + const Geometry& fgeom, + const Geometry& cgeom, const EB2::IndexSpace*); void flushFPinfo (bool no_assertion=false); @@ -466,6 +458,7 @@ public: int n_comp; mutable BDKey m_bdkey; IntVect n_filled; // Note that IntVect is zero by default. + bool m_multi_ghost = false; // // Tiling @@ -501,7 +494,7 @@ public: { FB (const FabArrayBase& fa, const IntVect& nghost, bool cross, const Periodicity& period, - bool enforce_periodicity_only); + bool enforce_periodicity_only, bool multi_ghost = false); ~FB (); IndexType m_typ; @@ -512,6 +505,7 @@ public: Periodicity m_period; // Long m_nuse; + bool m_multi_ghost = false; // #if ( defined(__CUDACC__) && (__CUDACC_VER_MAJOR__ >= 10) ) CudaGraph m_localCopy; diff --git a/Src/Base/AMReX_FabArrayBase.cpp b/Src/Base/AMReX_FabArrayBase.cpp index 2a775f9e792..50e00ad2c9c 100644 --- a/Src/Base/AMReX_FabArrayBase.cpp +++ b/Src/Base/AMReX_FabArrayBase.cpp @@ -25,7 +25,7 @@ namespace amrex { // int FabArrayBase::MaxComp; -#if defined(AMREX_USE_GPU) && defined(AMREX_USE_GPU_PRAGMA) +#if defined(AMREX_USE_GPU) #if AMREX_SPACEDIM == 1 IntVect FabArrayBase::mfiter_tile_size(1024000); @@ -116,11 +116,15 @@ FabArrayBase::Initialize () MaxComp = 1; } +#ifdef AMREX_USE_GPU if (ParallelDescriptor::UseGpuAwareMpi()) { - the_fa_arena = The_Device_Arena(); + the_fa_arena = The_Arena(); } else { the_fa_arena = The_Pinned_Arena(); } +#else + the_fa_arena = The_Cpu_Arena(); +#endif amrex::ExecOnFinalize(FabArrayBase::Finalize); @@ -509,6 +513,7 @@ FabArrayBase::CPC::CPC (const BoxArray& ba, const IntVect& ng, void FabArrayBase::flushCPC (bool no_assertion) const { + amrex::ignore_unused(no_assertion); BL_ASSERT(no_assertion || getBDKey() == m_bdkey); std::vector others; @@ -621,11 +626,12 @@ FabArrayBase::getCPC (const IntVect& dstng, const FabArrayBase& src, const IntVe FabArrayBase::FB::FB (const FabArrayBase& fa, const IntVect& nghost, bool cross, const Periodicity& period, - bool enforce_periodicity_only) + bool enforce_periodicity_only, + bool multi_ghost) : m_typ(fa.boxArray().ixType()), m_crse_ratio(fa.boxArray().crseRatio()), m_ngrow(nghost), m_cross(cross), m_epo(enforce_periodicity_only), m_period(period), - m_nuse(0) + m_nuse(0), m_multi_ghost(multi_ghost) { BL_PROFILE("FabArrayBase::FB::FB()"); @@ -646,6 +652,8 @@ FabArrayBase::FB::FB (const FabArrayBase& fa, const IntVect& nghost, void FabArrayBase::FB::define_fb(const FabArrayBase& fa) { + AMREX_ASSERT(m_multi_ghost ? 
fa.nGrow() >= 2 : true); // must have >= 2 ghost nodes + AMREX_ASSERT(m_multi_ghost ? !m_period.isAnyPeriodic() : true); // this only works for non-periodic const int MyProc = ParallelDescriptor::MyProc(); const BoxArray& ba = fa.boxArray(); const DistributionMapping& dm = fa.DistributionMap(); @@ -656,6 +664,7 @@ FabArrayBase::FB::define_fb(const FabArrayBase& fa) const int nlocal = imap.size(); const IntVect& ng = m_ngrow; + const IntVect ng_ng = m_ngrow - 1; std::vector< std::pair > isects; const std::vector& pshifts = m_period.shiftIntVect(); @@ -666,7 +675,8 @@ FabArrayBase::FB::define_fb(const FabArrayBase& fa) { const int ksnd = imap[i]; const Box& vbx = ba[ksnd]; - + const Box& vbx_ng = amrex::grow(vbx,1); + for (auto pit=pshifts.cbegin(); pit!=pshifts.cend(); ++pit) { ba.intersections(vbx+(*pit), isects, false, ng); @@ -680,7 +690,20 @@ FabArrayBase::FB::define_fb(const FabArrayBase& fa) if (ParallelDescriptor::sameTeam(dst_owner)) { continue; // local copy will be dealt with later } else if (MyProc == dm[ksnd]) { - const BoxList& bl = amrex::boxDiff(bx, ba[krcv]); + BoxList bl = amrex::boxDiff(bx, ba[krcv]); + if (m_multi_ghost) + { + // In the case where ngrow>1, augment the send/rcv box list + // with boxes for overlapping ghost nodes. + const Box& ba_krcv = amrex::grow(ba[krcv],1); + const Box& dst_bx_ng = (amrex::grow(ba_krcv,ng_ng) & (vbx_ng + (*pit))); + const BoxList &bltmp = ba.complementIn(dst_bx_ng); + for (auto const& btmp : bltmp) + { + bl.join(amrex::boxDiff(btmp,ba_krcv)); + } + bl.simplify(); + } for (BoxList::const_iterator lit = bl.begin(); lit != bl.end(); ++lit) send_tags[dst_owner].push_back(CopyComTag(*lit, (*lit)-(*pit), krcv, ksnd)); } @@ -713,6 +736,7 @@ FabArrayBase::FB::define_fb(const FabArrayBase& fa) { const int krcv = imap[i]; const Box& vbx = ba[krcv]; + const Box& vbx_ng = amrex::grow(vbx,1); const Box& bxrcv = amrex::grow(vbx, ng); if (check_local) { @@ -735,7 +759,22 @@ FabArrayBase::FB::define_fb(const FabArrayBase& fa) const Box& dst_bx = isects[j].second - *pit; const int src_owner = dm[ksnd]; - const BoxList& bl = amrex::boxDiff(dst_bx, vbx); + BoxList bl = amrex::boxDiff(dst_bx, vbx); + + if (m_multi_ghost) + { + // In the case where ngrow>1, augment the send/rcv box list + // with boxes for overlapping ghost nodes. 
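The multi-ghost branches above assemble their extra communication boxes with amrex::boxDiff (the parts of one box not covered by another), joined with complementIn results and then simplified. A 1-D reconstruction of the boxDiff operation, using closed integer intervals the way amrex::Box does:

    #include <utility>
    #include <vector>

    // Pieces of [alo,ahi] not covered by [blo,bhi]; the real routine does
    // this per dimension on AMREX_SPACEDIM-dimensional boxes and returns a
    // BoxList.
    std::vector<std::pair<int,int>> box_diff_1d (int alo, int ahi, int blo, int bhi)
    {
        std::vector<std::pair<int,int>> out;
        if (bhi < alo || blo > ahi) {      // no overlap: all of A survives
            out.emplace_back(alo, ahi);
            return out;
        }
        if (blo > alo) { out.emplace_back(alo, blo-1); }  // piece left of B
        if (bhi < ahi) { out.emplace_back(bhi+1, ahi); }  // piece right of B
        return out;
    }
    // box_diff_1d(0,9, 3,5) yields {(0,2), (6,9)}.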
+ Box ba_ksnd = ba[ksnd]; + ba_ksnd.grow(1); + const Box dst_bx_ng = (ba_ksnd & (bxrcv + (*pit))) - (*pit); + const BoxList &bltmp = ba.complementIn(dst_bx_ng); + for (auto const& btmp : bltmp) + { + bl.join(amrex::boxDiff(btmp,vbx_ng)); + } + bl.simplify(); + } for (BoxList::const_iterator lit = bl.begin(); lit != bl.end(); ++lit) { const Box& blbx = *lit; @@ -1010,6 +1049,7 @@ FabArrayBase::FB::~FB () void FabArrayBase::flushFB (bool no_assertion) const { + amrex::ignore_unused(no_assertion); BL_ASSERT(no_assertion || getBDKey() == m_bdkey); std::pair er_it = m_TheFBCache.equal_range(m_bdkey); for (FBCacheIter it = er_it.first; it != er_it.second; ++it) @@ -1051,6 +1091,7 @@ FabArrayBase::getFB (const IntVect& nghost, const Periodicity& period, it->second->m_crse_ratio == boxArray().crseRatio() && it->second->m_ngrow == nghost && it->second->m_cross == cross && + it->second->m_multi_ghost== m_multi_ghost && it->second->m_epo == enforce_periodicity_only && it->second->m_period == period ) { @@ -1061,7 +1102,7 @@ FabArrayBase::getFB (const IntVect& nghost, const Periodicity& period, } // Have to build a new one - FB* new_fb = new FB(*this, nghost, cross, period, enforce_periodicity_only); + FB* new_fb = new FB(*this, nghost, cross, period, enforce_periodicity_only,m_multi_ghost); #ifdef BL_PROFILE m_FBC_stats.bytes += new_fb->bytes(); @@ -1078,10 +1119,11 @@ FabArrayBase::getFB (const IntVect& nghost, const Periodicity& period, } FabArrayBase::FPinfo::FPinfo (const FabArrayBase& srcfa, - const FabArrayBase& dstfa, - const Box& dstdomain, - const IntVect& dstng, - const BoxConverter& coarsener, + const FabArrayBase& dstfa, + const Box& dstdomain, + const IntVect& dstng, + const BoxConverter& coarsener, + const Box& fdomain, const Box& cdomain, const EB2::IndexSpace* index_space) : m_srcbdk (srcfa.getBDKey()), @@ -1090,89 +1132,192 @@ FabArrayBase::FPinfo::FPinfo (const FabArrayBase& srcfa, m_dstng (dstng), m_coarsener(coarsener.clone()), m_nuse (0) -{ +{ + amrex::ignore_unused(fdomain,cdomain,index_space); BL_PROFILE("FPinfo::FPinfo()"); + const BoxArray& srcba = srcfa.boxArray(); const BoxArray& dstba = dstfa.boxArray(); BL_ASSERT(srcba.ixType() == dstba.ixType()); + BoxArray srcba_simplified = srcba.simplified(); + BoxArray dstba_simplified = dstba.simplified(); + const IndexType& boxtype = dstba.ixType(); BL_ASSERT(boxtype == dstdomain.ixType()); - - BL_ASSERT(dstng.allLE(dstfa.nGrowVect())); - const DistributionMapping& dstdm = dstfa.DistributionMap(); - - const int myproc = ParallelDescriptor::MyProc(); + BL_ASSERT(dstng.allLE(dstfa.nGrowVect())); BoxList bl(boxtype); - Vector iprocs; - - for (int i = 0, N = dstba.size(); i < N; ++i) - { - Box bx = dstba[i]; + const int Ndst = dstba_simplified.size(); + const int nprocs = ParallelContext::NProcsSub(); + int iboxlo, iboxhi; + bool parallel_ci; + if (Ndst > 8) { + parallel_ci = true; + const int navg = Ndst / nprocs; + const int nextra = Ndst - navg*nprocs; + const int myproc = ParallelContext::MyProcSub(); + iboxlo = (myproc < nextra) ? myproc*(navg+1) : myproc*navg+nextra; + iboxhi = (myproc < nextra) ? 
iboxlo+navg+1-1 : iboxlo+navg-1; + } else { + parallel_ci = false; + iboxlo = 0; + iboxhi = Ndst-1; + } + for (int i = iboxlo; i <= iboxhi; ++i) { + Box bx = dstba_simplified[i]; bx.grow(m_dstng); bx &= m_dstdomain; + BoxList const& leftover = srcba_simplified.complementIn(bx); + if (leftover.isNotEmpty()) { + bl.join(leftover); + } + } - BoxList leftover = srcba.complementIn(bx); + if (parallel_ci) { + amrex::AllGatherBoxes(bl.data()); + } - bool ismybox = (dstdm[i] == myproc); - for (BoxList::const_iterator bli = leftover.begin(); bli != leftover.end(); ++bli) - { - bl.push_back(m_coarsener->doit(*bli)); - if (ismybox) { - dst_boxes.push_back(*bli); - dst_idxs.push_back(i); + if (bl.isEmpty()) return; + + Long ncells_total = 0L; + Long ncells_max = 0L; + for (auto const& b : bl) { + auto n = b.numPts(); + ncells_total += n; + ncells_max = std::max(ncells_max, n); + } + + Long ncells_avg = ncells_total / ParallelContext::NProcsSub(); + Long ncells_target = std::max(2*ncells_avg, Long(8*8*8)); + if (ncells_max > ncells_target) { + BoxList bltmp(boxtype); + Vector& bltmpvec = bltmp.data(); + for (Box const& b : bl) { + Long const npts = b.numPts(); + if (npts <= ncells_target) { + bltmp.push_back(b); + } else { + IntVect const len = b.length(); + IntVect numblk{1}; + while (npts > (AMREX_D_TERM(numblk[0],*numblk[1],*numblk[2])) * ncells_target) { +#if (AMREX_SPACEDIM == 3) + int longdir = (len[2] >= len[0] && len[2] >= len[1]) ? 2 : + (len[1] >= len[0]) ? 1 : 0; +#elif (AMREX_SPACEDIM == 2) + int longdir = (len[1] >= len[0]) ? 1 : 0; +#elif (AMREX_SPACEDIM == 1) + int longdir = 0; +#else + static_assert(false, "FabArrayBase::FPinfo() unsupported AMREX_SPACEDIM"); +#endif + numblk[longdir] *= 2; + } + numblk.min(len); + IntVect sz, extra; + for (int idim = 0; idim < AMREX_SPACEDIM; ++idim) { + sz[idim] = len[idim] / numblk[idim]; + extra[idim] = len[idim] - sz[idim] * numblk[idim]; + } + if (numblk == 1) { + bltmp.push_back(b); + } else { + IntVect const& boxlo = b.smallEnd(); +#if (AMREX_SPACEDIM == 3) + for (int k = 0; k < numblk[2]; ++k) { + int klo = (k < extra[2]) ? k*(sz[2]+1) : (k*sz[2]+extra[2]); + int khi = (k < extra[2]) ? klo+(sz[2]+1)-1 : klo+sz[2]-1; + klo += boxlo[2]; + khi += boxlo[2]; +#endif +#if (AMREX_SPACEDIM >= 2) + for (int j = 0; j < numblk[1]; ++j) { + int jlo = (j < extra[1]) ? j*(sz[1]+1) : (j*sz[1]+extra[1]); + int jhi = (j < extra[1]) ? jlo+(sz[1]+1)-1 : jlo+sz[1]-1; + jlo += boxlo[1]; + jhi += boxlo[1]; +#endif + for (int i = 0; i < numblk[0]; ++i) { + int ilo = (i < extra[0]) ? i*(sz[0]+1) : (i*sz[0]+extra[0]); + int ihi = (i < extra[0]) ? 
ilo+(sz[0]+1)-1 : ilo+sz[0]-1; + ilo += boxlo[0]; + ihi += boxlo[0]; + bltmpvec.emplace_back(IntVect(AMREX_D_DECL(ilo,jlo,klo)), + IntVect(AMREX_D_DECL(ihi,jhi,khi)), + boxtype); + AMREX_D_TERM(},},}) + } } - iprocs.push_back(dstdm[i]); } + std::swap(bl,bltmp); + } + + BoxList blcrse(boxtype); + blcrse.reserve(bl.size()); + for (auto const& b : bl) { + blcrse.push_back(coarsener.doit(b)); } - if (!iprocs.empty()) { - ba_crse_patch.define(bl); - dm_crse_patch.define(std::move(iprocs)); + ba_crse_patch.define(std::move(blcrse)); + ba_fine_patch.define(std::move(bl)); + dm_patch.KnapSackProcessorMap(ba_fine_patch, ParallelContext::NProcsSub()); + #ifdef AMREX_USE_EB - if (index_space) - { - fact_crse_patch = makeEBFabFactory(index_space, - index_space->getGeometry(cdomain), - ba_crse_patch, - dm_crse_patch, - {0,0,0}, EBSupport::basic); - } - else + if (index_space) + { + fact_crse_patch = makeEBFabFactory(index_space, + index_space->getGeometry(cdomain), + ba_crse_patch, + dm_patch, + {0,0,0}, EBSupport::basic); + int ng = boxtype.cellCentered() ? 0 : 1; // to avoid dengerate box + fact_fine_patch = makeEBFabFactory(index_space, + index_space->getGeometry(fdomain), + ba_fine_patch, + dm_patch, + {ng,ng,ng}, EBSupport::basic); + } + else #endif - { - fact_crse_patch.reset(new FArrayBoxFactory()); - } + { + fact_crse_patch.reset(new FArrayBoxFactory()); + fact_fine_patch.reset(new FArrayBoxFactory()); } } FabArrayBase::FPinfo::~FPinfo () { - delete m_coarsener; } Long FabArrayBase::FPinfo::bytes () const { Long cnt = sizeof(FabArrayBase::FPinfo); - cnt += sizeof(Box) * (ba_crse_patch.capacity() + dst_boxes.capacity()); - cnt += sizeof(int) * (dm_crse_patch.capacity() + dst_idxs.capacity()); + cnt += sizeof(Box) * (ba_crse_patch.capacity() + ba_fine_patch.capacity()); + cnt += sizeof(int) * dm_patch.capacity(); return cnt; } const FabArrayBase::FPinfo& FabArrayBase::TheFPinfo (const FabArrayBase& srcfa, const FabArrayBase& dstfa, - const Box& dstdomain, const IntVect& dstng, const BoxConverter& coarsener, - const Box& cdomain, + const Geometry& fgeom, + const Geometry& cgeom, const EB2::IndexSpace* index_space) { BL_PROFILE("FabArrayBase::TheFPinfo()"); + Box dstdomain = fgeom.Domain(); + dstdomain.convert(dstfa.boxArray().ixType()); + for (int i = 0; i < AMREX_SPACEDIM; ++i) { + if (fgeom.isPeriodic(i)) { + dstdomain.grow(i,dstng[i]); + } + } + const BDKey& srckey = srcfa.getBDKey(); const BDKey& dstkey = dstfa.getBDKey(); @@ -1194,7 +1339,8 @@ FabArrayBase::TheFPinfo (const FabArrayBase& srcfa, } // Have to build a new one - FPinfo* new_fpc = new FPinfo(srcfa, dstfa, dstdomain, dstng, coarsener, cdomain, index_space); + FPinfo* new_fpc = new FPinfo(srcfa, dstfa, dstdomain, dstng, coarsener, + fgeom.Domain(), cgeom.Domain(), index_space); #ifdef AMREX_MEM_PROFILING m_FPinfo_stats.bytes += new_fpc->bytes(); @@ -1215,6 +1361,7 @@ FabArrayBase::TheFPinfo (const FabArrayBase& srcfa, void FabArrayBase::flushFPinfo (bool no_assertion) { + amrex::ignore_unused(no_assertion); BL_ASSERT(no_assertion || getBDKey() == m_bdkey); std::vector others; @@ -1374,6 +1521,7 @@ FabArrayBase::TheCFinfo (const FabArrayBase& finefa, void FabArrayBase::flushCFinfo (bool no_assertion) { + amrex::ignore_unused(no_assertion); BL_ASSERT(no_assertion || getBDKey() == m_bdkey); auto er_it = m_TheCrseFineCache.equal_range(m_bdkey); for (auto it = er_it.first; it != er_it.second; ++it) @@ -1554,6 +1702,7 @@ FabArrayBase::buildTileArray (const IntVect& tileSize, TileArray& ta) const void FabArrayBase::flushTileArray (const 
IntVect& tileSize, bool no_assertion) const { + amrex::ignore_unused(no_assertion); BL_ASSERT(no_assertion || getBDKey() == m_bdkey); TACache& tao = m_TheTileArrayCache; @@ -1658,6 +1807,7 @@ FabArrayBase::WaitForAsyncSends (int N_snds, Vector& send_data, Vector& stats) { + amrex::ignore_unused(send_data); #ifdef BL_USE_MPI BL_ASSERT(N_snds > 0); @@ -1667,6 +1817,8 @@ FabArrayBase::WaitForAsyncSends (int N_snds, BL_ASSERT(send_data.size() == N_snds); ParallelDescriptor::Waitall(send_reqs, stats); +#else + amrex::ignore_unused(N_snds,send_reqs,stats); #endif /*BL_USE_MPI*/ } @@ -1680,8 +1832,8 @@ FabArrayBase::CheckRcvStats(Vector& recv_stats, { for (int i = 0, n = recv_size.size(); i < n; ++i) { if (recv_size[i] > 0) { - std::size_t count; - int tmp_count; + std::size_t count = 0; + int tmp_count = 0; const int comm_data_type = ParallelDescriptor::select_comm_data_type(recv_size[i]); if (comm_data_type == 1) { diff --git a/Src/Base/AMReX_FabArrayCommI.H b/Src/Base/AMReX_FabArrayCommI.H index 88174cbb4b9..a0f05f93d24 100644 --- a/Src/Base/AMReX_FabArrayCommI.H +++ b/Src/Base/AMReX_FabArrayCommI.H @@ -3,7 +3,7 @@ #include template -template // FOO fools nvcc +template ::value,int>::type Z> void FabArray::FBEP_nowait (int scomp, int ncomp, const IntVect& nghost, const Periodicity& period, bool cross, @@ -83,7 +83,7 @@ FabArray::FBEP_nowait (int scomp, int ncomp, const IntVect& nghost, if (N_rcvs > 0) { PostRcvs(*TheFB.m_RcvTags, fb_the_recv_data, fb_recv_data, fb_recv_size, fb_recv_from, fb_recv_reqs, - scomp, ncomp, SeqNum); + ncomp, SeqNum); fb_recv_stat.resize(N_rcvs); } @@ -118,7 +118,7 @@ FabArray::FBEP_nowait (int scomp, int ncomp, const IntVect& nghost, std::size_t nbytes = 0; for (auto const& cct : kv.second) { - nbytes += (*this)[cct.srcIndex].nBytes(cct.sbox,scomp,ncomp); + nbytes += (*this)[cct.srcIndex].nBytes(cct.sbox,ncomp); } std::size_t acd = ParallelDescriptor::alignof_comm_data(nbytes); @@ -143,9 +143,7 @@ FabArray::FBEP_nowait (int scomp, int ncomp, const IntVect& nghost, { the_send_data = static_cast(amrex::The_FA_Arena()->alloc(total_volume)); for (int i = 0, N = send_size.size(); i < N; ++i) { - if (send_size[i] > 0) { - send_data[i] = the_send_data + offset[i]; - } + send_data[i] = the_send_data + offset[i]; } } else { the_send_data = nullptr; @@ -231,7 +229,7 @@ FabArray::FBEP_nowait (int scomp, int ncomp, const IntVect& nghost, } template -template // FOO fools nvcc +template ::value,int>::type Z> void FabArray::FillBoundary_finish () { @@ -439,7 +437,7 @@ FabArray::ParallelCopy (const FabArray& src, int actual_n_rcvs = 0; if (N_rcvs > 0) { PostRcvs(*thecpc.m_RcvTags, the_recv_data, - recv_data, recv_size, recv_from, recv_reqs, SC, NC, SeqNum); + recv_data, recv_size, recv_from, recv_reqs, NC, SeqNum); actual_n_rcvs = N_rcvs - std::count(recv_size.begin(), recv_size.end(), 0); } @@ -471,7 +469,7 @@ FabArray::ParallelCopy (const FabArray& src, std::size_t nbytes = 0; for (auto const& cct : kv.second) { - nbytes += src[cct.srcIndex].nBytes(cct.sbox,SC,NC); + nbytes += src[cct.srcIndex].nBytes(cct.sbox,NC); } std::size_t acd = ParallelDescriptor::alignof_comm_data(nbytes); @@ -495,9 +493,7 @@ FabArray::ParallelCopy (const FabArray& src, { the_send_data = static_cast(amrex::The_FA_Arena()->alloc(total_volume)); for (int i = 0, N = send_size.size(); i < N; ++i) { - if (send_size[i] > 0) { - send_data[i] = the_send_data + offset[i]; - } + send_data[i] = the_send_data + offset[i]; } } @@ -701,7 +697,6 @@ FabArray::PostRcvs (const MapOfCopyComTagContainers& m_RcvTags, Vector& 
recv_size, Vector& recv_from, Vector& recv_reqs, - int icomp, int ncomp, int SeqNum) { @@ -717,7 +712,7 @@ FabArray::PostRcvs (const MapOfCopyComTagContainers& m_RcvTags, std::size_t nbytes = 0; for (auto const& cct : kv.second) { - nbytes += (*this)[cct.dstIndex].nBytes(cct.dbox,icomp,ncomp); + nbytes += (*this)[cct.dstIndex].nBytes(cct.dbox,ncomp); } std::size_t acd = ParallelDescriptor::alignof_comm_data(nbytes); @@ -750,9 +745,9 @@ FabArray::PostRcvs (const MapOfCopyComTagContainers& m_RcvTags, for (int i = 0; i < nrecv; ++i) { + recv_data[i] = the_recv_data + offset[i]; if (recv_size[i] > 0) { - recv_data[i] = the_recv_data + offset[i]; const int rank = ParallelContext::global_to_local_rank(recv_from[i]); const int comm_data_type = ParallelDescriptor::select_comm_data_type(recv_size[i]); if (comm_data_type == 1) { diff --git a/Src/Base/AMReX_FabArrayUtility.H b/Src/Base/AMReX_FabArrayUtility.H index 654b41956f7..869fd172d89 100644 --- a/Src/Base/AMReX_FabArrayUtility.H +++ b/Src/Base/AMReX_FabArrayUtility.H @@ -12,7 +12,7 @@ template ::value> > typename FAB::value_type ReduceSum (FabArray const& fa, int nghost, F&& f) { - return ReduceSum(fa, IntVect(nghost), std::move(f)); + return ReduceSum(fa, IntVect(nghost), std::forward(f)); } namespace fudetail { @@ -75,13 +75,14 @@ template amrex::EnableIf_t::value, typename FAB::value_type> ReduceSum_host_wrapper (FabArray const& fa, IntVect const& nghost, F&& f) { - return ReduceSum_host(fa,nghost,std::move(f)); + return ReduceSum_host(fa,nghost,std::forward(f)); } template amrex::EnableIf_t::value, typename FAB::value_type> ReduceSum_host_wrapper (FabArray const& fa, IntVect const& nghost, F&& f) { + amrex::ignore_unused(fa,nghost,f); amrex::Abort("ReduceSum: Launch Region is off. Device lambda cannot be called by host."); return 0; } @@ -93,9 +94,9 @@ typename FAB::value_type ReduceSum (FabArray const& fa, IntVect const& nghost, F&& f) { if (Gpu::inLaunchRegion()) { - return fudetail::ReduceSum_device(fa, nghost, std::move(f)); + return fudetail::ReduceSum_device(fa, nghost, std::forward(f)); } else { - return fudetail::ReduceSum_host_wrapper(fa, nghost, std::move(f)); + return fudetail::ReduceSum_host_wrapper(fa, nghost, std::forward(f)); } } #else @@ -104,7 +105,7 @@ template const& fa, IntVect const& nghost, F&& f) { - return fudetail::ReduceSum_host(fa, nghost, std::move(f)); + return fudetail::ReduceSum_host(fa, nghost, std::forward(f)); } #endif @@ -113,7 +114,7 @@ template const& fa1, FabArray const& fa2, int nghost, F&& f) { - return ReduceSum(fa1, fa2, IntVect(nghost), std::move(f)); + return ReduceSum(fa1, fa2, IntVect(nghost), std::forward(f)); } namespace fudetail { @@ -152,11 +153,13 @@ ReduceSum_device (FabArray const& fa1, FabArray const& fa2, using value_type = typename FAB1::value_type; value_type sm = 0; + BL_PROFILE("ReduceSum_device"); + { ReduceOps reduce_op; ReduceData reduce_data(reduce_op); using ReduceTuple = typename decltype(reduce_data)::Type; - + Gpu::FuseReductionSafeGuard rsg(true); for (MFIter mfi(fa1); mfi.isValid(); ++mfi) { const Box& bx = amrex::grow(mfi.validbox(),nghost); @@ -181,7 +184,7 @@ amrex::EnableIf_t::value, typename FAB1::va ReduceSum_host_wrapper (FabArray const& fa1, FabArray const& fa2, IntVect const& nghost, F&& f) { - return ReduceSum_host(fa1,fa2,nghost,std::move(f)); + return ReduceSum_host(fa1,fa2,nghost,std::forward(f)); } template @@ -189,6 +192,7 @@ amrex::EnableIf_t::value, typename FAB1::val ReduceSum_host_wrapper (FabArray const& fa1, FabArray const& fa2, IntVect const& nghost, 
F&& f) { + amrex::ignore_unused(fa1,fa2,nghost,f); amrex::Abort("ReduceSum: Launch Region is off. Device lambda cannot be called by host."); return 0; } @@ -201,9 +205,9 @@ ReduceSum (FabArray const& fa1, FabArray const& fa2, IntVect const& nghost, F&& f) { if (Gpu::inLaunchRegion()) { - return fudetail::ReduceSum_device(fa1,fa2,nghost,std::move(f)); + return fudetail::ReduceSum_device(fa1,fa2,nghost,std::forward(f)); } else { - return fudetail::ReduceSum_host_wrapper(fa1,fa2,nghost,std::move(f)); + return fudetail::ReduceSum_host_wrapper(fa1,fa2,nghost,std::forward(f)); } } #else @@ -213,7 +217,7 @@ typename FAB1::value_type ReduceSum (FabArray const& fa1, FabArray const& fa2, IntVect const& nghost, F&& f) { - return fudetail::ReduceSum_host(fa1,fa2,nghost,std::move(f)); + return fudetail::ReduceSum_host(fa1,fa2,nghost,std::forward(f)); } #endif @@ -223,7 +227,7 @@ typename FAB1::value_type ReduceSum (FabArray const& fa1, FabArray const& fa2, FabArray const& fa3, int nghost, F&& f) { - return ReduceSum(fa1, fa2, fa3, IntVect(nghost), std::move(f)); + return ReduceSum(fa1, fa2, fa3, IntVect(nghost), std::forward(f)); } namespace fudetail { @@ -293,7 +297,7 @@ amrex::EnableIf_t::value, typename FAB1::va ReduceSum_host_wrapper (FabArray const& fa1, FabArray const& fa2, FabArray const& fa3, IntVect const& nghost, F&& f) { - return fudetail::ReduceSum_host(fa1,fa2,fa3,nghost,std::move(f)); + return fudetail::ReduceSum_host(fa1,fa2,fa3,nghost,std::forward(f)); } template @@ -301,6 +305,7 @@ amrex::EnableIf_t::value, typename FAB1::val ReduceSum_host_wrapper (FabArray const& fa1, FabArray const& fa2, FabArray const& fa3, IntVect const& nghost, F&& f) { + amrex::ignore_unused(fa1,fa2,fa3,nghost,f); amrex::Abort("ReduceSum: Launch Region is off. Device lambda cannot be called by host."); return 0; } @@ -313,9 +318,9 @@ ReduceSum (FabArray const& fa1, FabArray const& fa2, FabArray const& fa3, IntVect const& nghost, F&& f) { if (Gpu::inLaunchRegion()) { - return fudetail::ReduceSum_device(fa1,fa2,fa3,nghost,std::move(f)); + return fudetail::ReduceSum_device(fa1,fa2,fa3,nghost,std::forward(f)); } else { - return fudetail::ReduceSum_host_wrapper(fa1,fa2,fa3,nghost,std::move(f)); + return fudetail::ReduceSum_host_wrapper(fa1,fa2,fa3,nghost,std::forward(f)); } } #else @@ -325,7 +330,7 @@ typename FAB1::value_type ReduceSum (FabArray const& fa1, FabArray const& fa2, FabArray const& fa3, IntVect const& nghost, F&& f) { - return fudetail::ReduceSum_host(fa1,fa2,fa3,nghost,std::move(f)); + return fudetail::ReduceSum_host(fa1,fa2,fa3,nghost,std::forward(f)); } #endif @@ -334,7 +339,7 @@ template const& fa, int nghost, F&& f) { - return ReduceMin(fa, IntVect(nghost), std::move(f)); + return ReduceMin(fa, IntVect(nghost), std::forward(f)); } namespace fudetail { @@ -398,13 +403,14 @@ template amrex::EnableIf_t::value, typename FAB::value_type> ReduceMin_host_wrapper (FabArray const& fa, IntVect const& nghost, F&& f) { - return ReduceMin_host(fa,nghost,std::move(f)); + return ReduceMin_host(fa,nghost,std::forward(f)); } template amrex::EnableIf_t::value, typename FAB::value_type> ReduceMin_host_wrapper (FabArray const& fa, IntVect const& nghost, F&& f) { + amrex::ignore_unused(fa,nghost,f); amrex::Abort("ReduceMin: Launch Region is off. 
Device lambda cannot be called by host."); return 0; } @@ -416,9 +422,9 @@ typename FAB::value_type ReduceMin (FabArray const& fa, IntVect const& nghost, F&& f) { if (Gpu::inLaunchRegion()) { - return fudetail::ReduceMin_device(fa, nghost, std::move(f)); + return fudetail::ReduceMin_device(fa, nghost, std::forward(f)); } else { - return fudetail::ReduceMin_host_wrapper(fa, nghost, std::move(f)); + return fudetail::ReduceMin_host_wrapper(fa, nghost, std::forward(f)); } } #else @@ -427,7 +433,7 @@ template const& fa, IntVect const& nghost, F&& f) { - return fudetail::ReduceMin_host(fa, nghost, std::move(f)); + return fudetail::ReduceMin_host(fa, nghost, std::forward(f)); } #endif @@ -436,7 +442,7 @@ template const& fa1, FabArray const& fa2, int nghost, F&& f) { - return ReduceMin(fa1, fa2, IntVect(nghost), std::move(f)); + return ReduceMin(fa1, fa2, IntVect(nghost), std::forward(f)); } namespace fudetail { @@ -506,7 +512,7 @@ amrex::EnableIf_t::value, typename FAB1::va ReduceMin_host_wrapper (FabArray const& fa1, FabArray const& fa2, IntVect const& nghost, F&& f) { - return fudetail::ReduceMin_host(fa1,fa2,nghost,std::move(f)); + return fudetail::ReduceMin_host(fa1,fa2,nghost,std::forward(f)); } template @@ -514,6 +520,7 @@ amrex::EnableIf_t::value, typename FAB1::val ReduceMin_host_wrapper (FabArray const& fa1, FabArray const& fa2, IntVect const& nghost, F&& f) { + amrex::ignore_unused(fa1,fa2,nghost,f); amrex::Abort("ReduceMin: Launch Region is off. Device lambda cannot be called by host."); return 0; } @@ -526,9 +533,9 @@ ReduceMin (FabArray const& fa1, FabArray const& fa2, IntVect const& nghost, F&& f) { if (Gpu::inLaunchRegion()) { - return fudetail::ReduceMin_device(fa1,fa2,nghost,std::move(f)); + return fudetail::ReduceMin_device(fa1,fa2,nghost,std::forward(f)); } else { - return fudetail::ReduceMin_host_wrapper(fa1,fa2,nghost,std::move(f)); + return fudetail::ReduceMin_host_wrapper(fa1,fa2,nghost,std::forward(f)); } } #else @@ -538,7 +545,7 @@ typename FAB1::value_type ReduceMin (FabArray const& fa1, FabArray const& fa2, IntVect const& nghost, F&& f) { - return fudetail::ReduceMin_host(fa1,fa2,nghost,std::move(f)); + return fudetail::ReduceMin_host(fa1,fa2,nghost,std::forward(f)); } #endif @@ -548,7 +555,7 @@ typename FAB1::value_type ReduceMin (FabArray const& fa1, FabArray const& fa2, FabArray const& fa3, int nghost, F&& f) { - return ReduceMin(fa1, fa2, fa3, IntVect(nghost), std::move(f)); + return ReduceMin(fa1, fa2, fa3, IntVect(nghost), std::forward(f)); } namespace fudetail { @@ -620,7 +627,7 @@ amrex::EnableIf_t::value, typename FAB1::va ReduceMin_host_wrapper (FabArray const& fa1, FabArray const& fa2, FabArray const& fa3, IntVect const& nghost, F&& f) { - return fudetail::ReduceMin_host(fa1,fa2,fa3,nghost,std::move(f)); + return fudetail::ReduceMin_host(fa1,fa2,fa3,nghost,std::forward(f)); } template @@ -628,6 +635,7 @@ amrex::EnableIf_t::value, typename FAB1::val ReduceMin_host_wrapper (FabArray const& fa1, FabArray const& fa2, FabArray const& fa3, IntVect const& nghost, F&& f) { + amrex::ignore_unused(fa1,fa2,fa3,nghost,f); amrex::Abort("ReduceMin: Launch Region is off. 
Device lambda cannot be called by host."); return 0; } @@ -640,9 +648,9 @@ ReduceMin (FabArray const& fa1, FabArray const& fa2, FabArray const& fa3, IntVect const& nghost, F&& f) { if (Gpu::inLaunchRegion()) { - return fudetail::ReduceMin_device(fa1,fa2,fa3,nghost,std::move(f)); + return fudetail::ReduceMin_device(fa1,fa2,fa3,nghost,std::forward(f)); } else { - return fudetail::ReduceMin_host_wrapper(fa1,fa2,fa3,nghost,std::move(f)); + return fudetail::ReduceMin_host_wrapper(fa1,fa2,fa3,nghost,std::forward(f)); } } #else @@ -652,7 +660,7 @@ typename FAB1::value_type ReduceMin (FabArray const& fa1, FabArray const& fa2, FabArray const& fa3, IntVect const& nghost, F&& f) { - return fudetail::ReduceMin_host(fa1,fa2,fa3,nghost,std::move(f)); + return fudetail::ReduceMin_host(fa1,fa2,fa3,nghost,std::forward(f)); } #endif @@ -661,7 +669,7 @@ template const& fa, int nghost, F&& f) { - return ReduceMax(fa, IntVect(nghost), std::move(f)); + return ReduceMax(fa, IntVect(nghost), std::forward(f)); } namespace fudetail { @@ -726,13 +734,14 @@ template amrex::EnableIf_t::value, typename FAB::value_type> ReduceMax_host_wrapper (FabArray const& fa, IntVect const& nghost, F&& f) { - return ReduceMax_host(fa,nghost,std::move(f)); + return ReduceMax_host(fa,nghost,std::forward(f)); } template amrex::EnableIf_t::value, typename FAB::value_type> ReduceMax_host_wrapper (FabArray const& fa, IntVect const& nghost, F&& f) { + amrex::ignore_unused(fa,nghost,f); amrex::Abort("ReduceMax: Launch Region is off. Device lambda cannot be called by host."); return 0; } @@ -744,9 +753,9 @@ typename FAB::value_type ReduceMax (FabArray const& fa, IntVect const& nghost, F&& f) { if (Gpu::inLaunchRegion()) { - return fudetail::ReduceMax_device(fa,nghost,std::move(f)); + return fudetail::ReduceMax_device(fa,nghost,std::forward(f)); } else { - return fudetail::ReduceMax_host_wrapper(fa,nghost,std::move(f)); + return fudetail::ReduceMax_host_wrapper(fa,nghost,std::forward(f)); } } #else @@ -755,7 +764,7 @@ template const& fa, IntVect const& nghost, F&& f) { - return fudetail::ReduceMax_host(fa,nghost,std::move(f)); + return fudetail::ReduceMax_host(fa,nghost,std::forward(f)); } #endif @@ -764,7 +773,7 @@ template const& fa1, FabArray const& fa2, int nghost, F&& f) { - return ReduceMax(fa1, fa2, IntVect(nghost), std::move(f)); + return ReduceMax(fa1, fa2, IntVect(nghost), std::forward(f)); } namespace fudetail { @@ -834,7 +843,7 @@ amrex::EnableIf_t::value, typename FAB1::va ReduceMax_host_wrapper (FabArray const& fa1, FabArray const& fa2, IntVect const& nghost, F&& f) { - return ReduceMax_host(fa1,fa2,nghost,std::move(f)); + return ReduceMax_host(fa1,fa2,nghost,std::forward(f)); } template @@ -842,6 +851,7 @@ amrex::EnableIf_t::value, typename FAB1::val ReduceMax_host_wrapper (FabArray const& fa1, FabArray const& fa2, IntVect const& nghost, F&& f) { + amrex::ignore_unused(fa1,fa2,nghost,f); amrex::Abort("ReduceMax: Launch Region is off. Device lambda cannot be called by host."); return 0; }
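
The recurring change in this header is std::move(f) becoming std::forward(f) (std::forward<F>(f) before the template brackets were stripped from this listing) wherever f is a forwarding-reference parameter F&& f. A minimal, self-contained illustration of why forwarding is the right call in such pass-through wrappers:

#include <iostream>
#include <string>
#include <utility>

void sink (std::string const& s) { std::cout << "lvalue overload: " << s << '\n'; }
void sink (std::string&& s)      { std::cout << "rvalue overload: " << s << '\n'; }

template <typename T>
void wrapper (T&& s)
{
    // std::forward preserves the caller's value category; an unconditional
    // std::move would force the rvalue overload even for a caller's lvalue.
    sink(std::forward<T>(s));
}

int main ()
{
    std::string a = "kept";
    wrapper(a);                   // lvalue stays an lvalue
    wrapper(std::string("temp")); // rvalue stays an rvalue
}
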
@@ -854,9 +864,9 @@ ReduceMax (FabArray const& fa1, FabArray const& fa2, IntVect const& nghost, F&& f) { if (Gpu::inLaunchRegion()) { - return fudetail::ReduceMax_device(fa1,fa2,nghost,std::move(f)); + return fudetail::ReduceMax_device(fa1,fa2,nghost,std::forward(f)); } else { - return fudetail::ReduceMax_host_wrapper(fa1,fa2,nghost,std::move(f)); + return fudetail::ReduceMax_host_wrapper(fa1,fa2,nghost,std::forward(f)); } } #else @@ -866,7 +876,7 @@ typename FAB1::value_type ReduceMax (FabArray const& fa1, FabArray const& fa2, IntVect const& nghost, F&& f) { - return fudetail::ReduceMax_host(fa1,fa2,nghost,std::move(f)); + return fudetail::ReduceMax_host(fa1,fa2,nghost,std::forward(f)); } #endif @@ -876,7 +886,7 @@ typename FAB1::value_type ReduceMax (FabArray const& fa1, FabArray const& fa2, FabArray const& fa3, int nghost, F&& f) { - return ReduceMax(fa1, fa2, fa3, IntVect(nghost), std::move(f)); + return ReduceMax(fa1, fa2, fa3, IntVect(nghost), std::forward(f)); } namespace fudetail { @@ -948,7 +958,7 @@ amrex::EnableIf_t::value, typename FAB1::va ReduceMax_host_wrapper (FabArray const& fa1, FabArray const& fa2, FabArray const& fa3, IntVect const& nghost, F&& f) { - return fudetail::ReduceMax_host(fa1,fa2,fa3,nghost,std::move(f)); + return fudetail::ReduceMax_host(fa1,fa2,fa3,nghost,std::forward(f)); } template @@ -956,6 +966,7 @@ amrex::EnableIf_t::value, typename FAB1::val ReduceMax_host_wrapper (FabArray const& fa1, FabArray const& fa2, FabArray const& fa3, IntVect const& nghost, F&& f) { + amrex::ignore_unused(fa1,fa2,fa3,nghost,f); amrex::Abort("ReduceMax: Launch Region is off. Device lambda cannot be called by host."); return 0; } @@ -968,9 +979,9 @@ ReduceMax (FabArray const& fa1, FabArray const& fa2, FabArray const& fa3, IntVect const& nghost, F&& f) { if (Gpu::inLaunchRegion()) { - return fudetail::ReduceMax_device(fa1,fa2,fa3,nghost,std::move(f)); + return fudetail::ReduceMax_device(fa1,fa2,fa3,nghost,std::forward(f)); } else { - return fudetail::ReduceMax_host_wrapper(fa1,fa2,fa3,nghost,std::forward(f)); + return fudetail::ReduceMax_host_wrapper(fa1,fa2,fa3,nghost,std::forward(f)); } } #else @@ -980,7 +991,7 @@ typename FAB1::value_type ReduceMax (FabArray const& fa1, FabArray const& fa2, FabArray const& fa3, IntVect const& nghost, F&& f) { - return fudetail::ReduceMax_host(fa1,fa2,fa3,nghost,std::move(f)); + return fudetail::ReduceMax_host(fa1,fa2,fa3,nghost,std::forward(f)); } #endif @@ -989,7 +1000,7 @@ template const& fa, int nghost, F&& f) { - return ReduceLogicalAnd(fa, IntVect(nghost), std::move(f)); + return ReduceLogicalAnd(fa, IntVect(nghost), std::forward(f)); } namespace fudetail { @@ -1051,13 +1062,14 @@ template amrex::EnableIf_t::value, bool> ReduceLogicalAnd_host_wrapper (FabArray const& fa, IntVect const& nghost, F&& f) { - return ReduceLogicalAnd_host(fa,nghost,std::move(f)); + return ReduceLogicalAnd_host(fa,nghost,std::forward(f)); } template amrex::EnableIf_t::value, bool> ReduceLogicalAnd_host_wrapper (FabArray const& fa, IntVect const& nghost, F&& f) { + amrex::ignore_unused(fa,nghost,f); amrex::Abort("ReduceLogicalAnd: Launch Region is off.
Device lambda cannot be called by host."); return false; } @@ -1069,9 +1081,9 @@ bool ReduceLogicalAnd (FabArray const& fa, IntVect const& nghost, F&& f) { if (Gpu::inLaunchRegion()) { - return fudetail::ReduceLogicalAnd_device(fa,nghost,std::move(f)); + return fudetail::ReduceLogicalAnd_device(fa,nghost,std::forward(f)); } else { - return fudetail::ReduceLogicalAnd_host_wrapper(fa,nghost,std::move(f)); + return fudetail::ReduceLogicalAnd_host_wrapper(fa,nghost,std::forward(f)); } } #else @@ -1080,7 +1092,7 @@ template const& fa, IntVect const& nghost, F&& f) { - return fudetail::ReduceLogicalAnd_host(fa,nghost,std::move(f)); + return fudetail::ReduceLogicalAnd_host(fa,nghost,std::forward(f)); } #endif @@ -1090,7 +1102,7 @@ bool ReduceLogicalAnd (FabArray const& fa1, FabArray const& fa2, int nghost, F&& f) { - return ReduceLogicalAnd(fa1, fa2, IntVect(nghost), std::move(f)); + return ReduceLogicalAnd(fa1, fa2, IntVect(nghost), std::forward(f)); } namespace fudetail { @@ -1157,7 +1169,7 @@ amrex::EnableIf_t::value, bool> ReduceLogicalAnd_host_wrapper (FabArray const& fa1, FabArray const& fa2, IntVect const& nghost, F&& f) { - return ReduceLogicalAnd_host(fa1,fa2,nghost,std::move(f)); + return ReduceLogicalAnd_host(fa1,fa2,nghost,std::forward(f)); } template @@ -1165,6 +1177,7 @@ amrex::EnableIf_t::value, bool> ReduceLogicalAnd_host_wrapper (FabArray const& fa1, FabArray const& fa2, IntVect const& nghost, F&& f) { + amrex::ignore_unused(fa1,fa2,nghost,f); amrex::Abort("ReduceLogicalAnd: Launch Region is off. Device lambda cannot be called by host."); return false; } @@ -1177,9 +1190,9 @@ ReduceLogicalAnd (FabArray const& fa1, FabArray const& fa2, IntVect const& nghost, F&& f) { if (Gpu::inLaunchRegion()) { - return fudetail::ReduceLogicalAnd_device(fa1,fa2,nghost,std::move(f)); + return fudetail::ReduceLogicalAnd_device(fa1,fa2,nghost,std::forward(f)); } else { - return fudetail::ReduceLogicalAnd_host_wrapper(fa1,fa2,nghost,std::move(f)); + return fudetail::ReduceLogicalAnd_host_wrapper(fa1,fa2,nghost,std::forward(f)); } } #else @@ -1189,7 +1202,7 @@ bool ReduceLogicalAnd (FabArray const& fa1, FabArray const& fa2, IntVect const& nghost, F&& f) { - return fudetail::ReduceLogicalAnd_host(fa1,fa2,nghost,std::move(f)); + return fudetail::ReduceLogicalAnd_host(fa1,fa2,nghost,std::forward(f)); } #endif @@ -1198,7 +1211,7 @@ template const& fa, int nghost, F&& f) { - return ReduceLogicalOr(fa, IntVect(nghost), std::move(f)); + return ReduceLogicalOr(fa, IntVect(nghost), std::forward(f)); } namespace fudetail { @@ -1260,13 +1273,14 @@ template amrex::EnableIf_t::value, bool> ReduceLogicalOr_host_wrapper (FabArray const& fa, IntVect const& nghost, F&& f) { - return ReduceLogicalOr_host(fa,nghost,std::move(f)); + return ReduceLogicalOr_host(fa,nghost,std::forward(f)); } template amrex::EnableIf_t::value, bool> ReduceLogicalOr_host_wrapper (FabArray const& fa, IntVect const& nghost, F&& f) { + amrex::ignore_unused(fa,nghost,f); amrex::Abort("ReduceLogicalOr: Launch Region is off. Device lambda cannot be called by host."); return 0; }
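
For context, callers drive these reductions with a box-plus-array functor, and the result is rank-local. A usage sketch for the single-array ReduceSum overload, assuming a MultiFab that is already set up elsewhere (AMREX_LOOP_3D is the same macro used by indexFromValue later in this patch):

#include <AMReX_MultiFab.H>
#include <AMReX_FabArrayUtility.H>

// Rank-local sum of component 0 over valid cells (nghost = 0).
amrex::Real sumComp0 (amrex::MultiFab const& mf)
{
    return amrex::ReduceSum(mf, 0,
        [=] AMREX_GPU_HOST_DEVICE (amrex::Box const& bx,
                                   amrex::Array4<amrex::Real const> const& a) -> amrex::Real
        {
            amrex::Real s = 0.;
            AMREX_LOOP_3D(bx, i, j, k, { s += a(i,j,k,0); });
            return s;
        });
}

If a global value is needed, the rank-local result would still have to be combined across MPI ranks afterwards, e.g. with amrex::ParallelDescriptor::ReduceRealSum.
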
@@ -1278,9 +1292,9 @@ bool ReduceLogicalOr (FabArray const& fa, IntVect const& nghost, F&& f) { if (Gpu::inLaunchRegion()) { - return fudetail::ReduceLogicalOr_device(fa,nghost,std::move(f)); + return fudetail::ReduceLogicalOr_device(fa,nghost,std::forward(f)); } else { - return fudetail::ReduceLogicalOr_host_wrapper(fa,nghost,std::move(f)); + return fudetail::ReduceLogicalOr_host_wrapper(fa,nghost,std::forward(f)); } } #else @@ -1289,7 +1303,7 @@ template const& fa, IntVect const& nghost, F&& f) { - return fudetail::ReduceLogicalOr_host(fa,nghost,std::move(f)); + return fudetail::ReduceLogicalOr_host(fa,nghost,std::forward(f)); } #endif @@ -1299,7 +1313,7 @@ bool ReduceLogicalOr (FabArray const& fa1, FabArray const& fa2, int nghost, F&& f) { - return ReduceLogicalOr(fa1, fa2, IntVect(nghost), std::move(f)); + return ReduceLogicalOr(fa1, fa2, IntVect(nghost), std::forward(f)); } namespace fudetail { @@ -1350,6 +1364,7 @@ ReduceLogicalOr_device (FabArray const& fa1, FabArray const& fa2, [=] AMREX_GPU_DEVICE (Box const& b) -> ReduceTuple { int tr = f(b, arr1, arr2); + return {tr}; }); } @@ -1365,7 +1380,7 @@ amrex::EnableIf_t::value, bool> ReduceLogicalOr_host_wrapper (FabArray const& fa1, FabArray const& fa2, IntVect const& nghost, F&& f) { - return fudetail::ReduceLogicalOr_host(fa1,fa2,nghost,std::move(f)); + return fudetail::ReduceLogicalOr_host(fa1,fa2,nghost,std::forward(f)); } template @@ -1373,6 +1388,7 @@ amrex::EnableIf_t::value, bool> ReduceLogicalOr_host_wrapper (FabArray const& fa1, FabArray const& fa2, IntVect const& nghost, F&& f) { + amrex::ignore_unused(fa1,fa2,nghost,f); amrex::Abort("ReduceLogicalOr: Launch Region is off. Device lambda cannot be called by host."); return false; } @@ -1385,9 +1401,9 @@ ReduceLogicalOr (FabArray const& fa1, FabArray const& fa2, IntVect const& nghost, F&& f) { if (Gpu::inLaunchRegion()) { - return fudetail::ReduceLogicalOr_device(fa1,fa2,nghost,std::move(f)); + return fudetail::ReduceLogicalOr_device(fa1,fa2,nghost,std::forward(f)); } else { - return fudetail::ReduceLogicalOr_host_wrapper(fa1,fa2,nghost,std::move(f)); + return fudetail::ReduceLogicalOr_host_wrapper(fa1,fa2,nghost,std::forward(f)); } } #else @@ -1397,7 +1413,7 @@ bool ReduceLogicalOr (FabArray const& fa1, FabArray const& fa2, IntVect const& nghost, F&& f) { - return fudetail::ReduceLogicalOr_host(fa1,fa2,nghost,std::move(f)); + return fudetail::ReduceLogicalOr_host(fa1,fa2,nghost,std::forward(f)); } #endif @@ -1453,7 +1469,7 @@ Add (FabArray& dst, FabArray const& src, int srccomp, int dstcomp, int { auto const srcFab = src.array(mfi); auto dstFab = dst.array(mfi); - AMREX_HOST_DEVICE_PARALLEL_FOR_4D ( bx, numcomp, i, j, k, n, + AMREX_HOST_DEVICE_PARALLEL_FOR_4D_FUSIBLE ( bx, numcomp, i, j, k, n, { dstFab(i,j,k,n+dstcomp) += srcFab(i,j,k,n+srccomp); }); @@ -1485,7 +1501,7 @@ Copy (FabArray& dst, FabArray const& src, int srccomp, int dstcomp, in { auto const srcFab = src.array(mfi); auto dstFab = dst.array(mfi); - AMREX_HOST_DEVICE_PARALLEL_FOR_4D ( bx, numcomp, i, j, k, n, + AMREX_HOST_DEVICE_PARALLEL_FOR_4D_FUSIBLE ( bx, numcomp, i, j, k, n, { dstFab(i,j,k,dstcomp+n) = srcFab(i,j,k,srccomp+n); }); @@ -1517,7 +1533,7 @@ Subtract (FabArray& dst, FabArray const& src, int srccomp, int dstcomp { auto const srcFab = src.array(mfi); auto dstFab = dst.array(mfi); - AMREX_HOST_DEVICE_PARALLEL_FOR_4D ( bx, numcomp, i, j, k, n, + AMREX_HOST_DEVICE_PARALLEL_FOR_4D_FUSIBLE ( bx, numcomp, i, j, k, n, { dstFab(i,j,k,n+dstcomp) -=
srcFab(i,j,k,n+srccomp); }); @@ -1549,7 +1565,7 @@ Multiply (FabArray& dst, FabArray const& src, int srccomp, int dstcomp { auto const srcFab = src.array(mfi); auto dstFab = dst.array(mfi); - AMREX_HOST_DEVICE_PARALLEL_FOR_4D ( bx, numcomp, i, j, k, n, + AMREX_HOST_DEVICE_PARALLEL_FOR_4D_FUSIBLE ( bx, numcomp, i, j, k, n, { dstFab(i,j,k,n+dstcomp) *= srcFab(i,j,k,n+srccomp); }); @@ -1581,7 +1597,7 @@ Divide (FabArray& dst, FabArray const& src, int srccomp, int dstcomp, { auto const srcFab = src.array(mfi); auto dstFab = dst.array(mfi); - AMREX_HOST_DEVICE_PARALLEL_FOR_4D ( bx, numcomp, i, j, k, n, + AMREX_HOST_DEVICE_PARALLEL_FOR_4D_FUSIBLE ( bx, numcomp, i, j, k, n, { dstFab(i,j,k,n+dstcomp) /= srcFab(i,j,k,n+srccomp); }); @@ -1592,29 +1608,28 @@ Divide (FabArray& dst, FabArray const& src, int srccomp, int dstcomp, template ::value> > void -Abs (FabArray& dst, FabArray const& src, int srccomp, int dstcomp, int numcomp, int nghost) +Abs (FabArray& fa, int icomp, int numcomp, int nghost) { - Abs(dst,src,srccomp,dstcomp,numcomp,IntVect(nghost)); + Abs(fa,icomp,numcomp,IntVect(nghost)); } template ::value> > void -Abs (FabArray& dst, FabArray const& src, int srccomp, int dstcomp, int numcomp, const IntVect& nghost) +Abs (FabArray& fa, int icomp, int numcomp, const IntVect& nghost) { #ifdef _OPENMP #pragma omp parallel if (Gpu::notInLaunchRegion()) #endif - for (MFIter mfi(dst,TilingIfNotGPU()); mfi.isValid(); ++mfi) + for (MFIter mfi(fa,TilingIfNotGPU()); mfi.isValid(); ++mfi) { const Box& bx = mfi.growntilebox(nghost); if (bx.ok()) { - auto const srcFab = src.array(mfi); - auto dstFab = dst.array(mfi); - AMREX_HOST_DEVICE_PARALLEL_FOR_4D ( bx, numcomp, i, j, k, n, + auto const& fab = fa.array(mfi); + AMREX_HOST_DEVICE_PARALLEL_FOR_4D_FUSIBLE ( bx, numcomp, i, j, k, n, { - dstFab(i,j,k,n+dstcomp) /= srcFab(i,j,k,n+srccomp); + fab(i,j,k,n+icomp) = amrex::Math::abs(fab(i,j,k,n+icomp)); }); } } @@ -1630,6 +1645,8 @@ prefetchToHost (FabArray const& fa, const bool synchronous = true) fa.prefetchToHost(mfi); } } +#else + amrex::ignore_unused(fa,synchronous); #endif } @@ -1643,6 +1660,8 @@ prefetchToDevice (FabArray const& fa, const bool synchronous = true) fa.prefetchToDevice(mfi); } } +#else + amrex::ignore_unused(fa,synchronous); #endif } @@ -1665,7 +1684,7 @@ OverrideSync (FabArray & fa, FabArray const& msk, const Periodicity& const Box& bx = mfi.tilebox(); auto fab = fa.array(mfi); auto const ifab = msk.array(mfi); - AMREX_HOST_DEVICE_PARALLEL_FOR_4D ( bx, ncomp, i, j, k, n, + AMREX_HOST_DEVICE_PARALLEL_FOR_4D_FUSIBLE ( bx, ncomp, i, j, k, n, { if (!ifab(i,j,k)) fab(i,j,k,n) = 0; }); @@ -1690,7 +1709,7 @@ dtoh_memcpy (FabArray& dst, FabArray const& src, for (MFIter mfi(dst); mfi.isValid(); ++mfi) { void* pdst = dst[mfi].dataPtr(dcomp); void const* psrc = src[mfi].dataPtr(scomp); - Gpu::dtoh_memcpy_async(pdst, psrc, dst[mfi].nBytes(mfi.fabbox(), dcomp, ncomp)); + Gpu::dtoh_memcpy_async(pdst, psrc, dst[mfi].nBytes(mfi.fabbox(), ncomp)); } #else Copy(dst, src, scomp, dcomp, ncomp, dst.nGrowVect()); @@ -1715,7 +1734,7 @@ htod_memcpy (FabArray& dst, FabArray const& src, for (MFIter mfi(dst); mfi.isValid(); ++mfi) { void* pdst = dst[mfi].dataPtr(dcomp); void const* psrc = src[mfi].dataPtr(scomp); - Gpu::htod_memcpy_async(pdst, psrc, dst[mfi].nBytes(mfi.fabbox(), dcomp, ncomp)); + Gpu::htod_memcpy_async(pdst, psrc, dst[mfi].nBytes(mfi.fabbox(), ncomp)); } #else Copy(dst, src, scomp, dcomp, ncomp, dst.nGrowVect()); @@ -1729,6 +1748,84 @@ htod_memcpy (FabArray& dst, FabArray const& src) htod_memcpy(dst, 
src, 0, 0, dst.nComp()); } +template ::value> > +IntVect +indexFromValue (FabArray const& mf, int comp, IntVect const& nghost, + typename FAB::value_type value) +{ + IntVect loc; + +#ifdef AMREX_USE_GPU + if (Gpu::inLaunchRegion()) + { + int tmp[1+AMREX_SPACEDIM] = {0}; + amrex::Gpu::AsyncArray aa(tmp, 1+AMREX_SPACEDIM); + int* p = aa.data(); + // This is a device ptr to 1+AMREX_SPACEDIM int zeros. + // The first is used as an atomic bool and the others for intvect. + for (MFIter mfi(mf); mfi.isValid(); ++mfi) { + const Box& bx = amrex::grow(mfi.validbox(), nghost); + auto const& arr = mf.const_array(mfi); + amrex::ParallelFor(bx, [=] AMREX_GPU_DEVICE (int i, int j, int k) noexcept + { + int* flag = p; + if (*flag == 0) { + if (arr(i,j,k,comp) == value) { + if (Gpu::Atomic::Exch(flag,1) == 0) { + AMREX_D_TERM(p[1] = i;, + p[2] = j;, + p[3] = k;); + } + } + } + }); + } + aa.copyToHost(tmp, 1+AMREX_SPACEDIM); + AMREX_D_TERM(loc[0] = tmp[1];, + loc[1] = tmp[2];, + loc[2] = tmp[3];); + } + else +#endif + { + bool f = false; +#ifdef _OPENMP +#pragma omp parallel +#endif + { + IntVect priv_loc = IntVect::TheMinVector(); + for (MFIter mfi(mf,true); mfi.isValid(); ++mfi) + { + const Box& bx = mfi.growntilebox(nghost); + auto const& fab = mf.const_array(mfi); + AMREX_LOOP_3D(bx, i, j, k, + { + if (fab(i,j,k,comp) == value) priv_loc = IntVect(AMREX_D_DECL(i,j,k)); + }); + } + + if (priv_loc.allGT(IntVect::TheMinVector())) { + bool old; +// we should be able to test on _OPENMP < 201107 for capture (version 3.1) +// but we must work around a bug in gcc < 4.9 +#if defined(_OPENMP) && _OPENMP < 201307 // OpenMP 4.0 +#pragma omp critical (amrex_indexfromvalue) +#elif defined(_OPENMP) +#pragma omp atomic capture +#endif + { + old = f; + f = true; + } + + if (old == false) loc = priv_loc; + } + } + } + + return loc; +} + } #endif diff --git a/Src/Base/AMReX_FabConv.cpp b/Src/Base/AMReX_FabConv.cpp index 025a5b7cd6f..0f750aa6b28 100644 --- a/Src/Base/AMReX_FabConv.cpp +++ b/Src/Base/AMReX_FabConv.cpp @@ -221,7 +221,7 @@ selectOrdering (int prec, RealDescriptor* RealDescriptor::newRealDescriptor (int iot, int prec, - const char* sys, + const char* /*sys*/, int ordering) { RealDescriptor* rd = 0; @@ -239,6 +239,8 @@ RealDescriptor::newRealDescriptor (int iot, case FABio::FAB_DOUBLE: rd = new RealDescriptor(FPC::ieee_double, ord, 8); return rd; + default: + return rd; } } case FABio::FAB_NATIVE: @@ -498,7 +500,7 @@ _pd_reorder (char* arr, const int* ord) { const int MAXLINE = 16; - char local[MAXLINE]; + char local[MAXLINE] = {0}; for (int j; nitems > 0; nitems--) { diff --git a/Src/Base/AMReX_FilCC_1D_C.H b/Src/Base/AMReX_FilCC_1D_C.H index 77e12be9172..189debc6d78 100644 --- a/Src/Base/AMReX_FilCC_1D_C.H +++ b/Src/Base/AMReX_FilCC_1D_C.H @@ -12,9 +12,9 @@ inline void filcc_cell (const IntVect& iv, Array4 const& q, const int dcomp, const int numcomp, - GeometryData const& geom, const Real time, + GeometryData const& geom, const Real /*time*/, const BCRec* bcr, const int bcomp, - const int orig_comp) noexcept + const int /*orig_comp*/) noexcept { const int i = iv[0]; diff --git a/Src/Base/AMReX_FilCC_2D_C.H b/Src/Base/AMReX_FilCC_2D_C.H index 3a7508283b9..5aab33f7fc5 100644 --- a/Src/Base/AMReX_FilCC_2D_C.H +++ b/Src/Base/AMReX_FilCC_2D_C.H @@ -12,9 +12,9 @@ inline void filcc_cell (const IntVect& iv, Array4 const& q, const int dcomp, const int numcomp, - GeometryData const& geom, const Real time, + GeometryData const& geom, const Real /*time*/, const BCRec* bcr, const int bcomp, - const int orig_comp) noexcept 
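
The indexFromValue kernel above claims the first matching cell by winning an atomic exchange on a device-side flag; later matches see the flag already set and do nothing. The same claim-the-flag idiom, reduced to a host-only sketch with std::atomic and hypothetical names (the real code uses Gpu::Atomic::Exch on an AsyncArray):

#include <atomic>
#include <iostream>
#include <vector>

// Return an index of an element equal to 'value', claimed by whichever
// thread wins the exchange; -1 if no element matches.
int findValueIndex (std::vector<int> const& v, int value)
{
    std::atomic<int> flag{0};
    int loc = -1; // written by at most one thread, the exchange winner
#ifdef _OPENMP
#pragma omp parallel for
#endif
    for (int i = 0; i < (int)v.size(); ++i) {
        if (v[i] == value && flag.load(std::memory_order_relaxed) == 0) {
            if (flag.exchange(1) == 0) { loc = i; }
        }
    }
    return loc;
}

int main ()
{
    std::vector<int> v{3, 5, 7, 5};
    std::cout << findValueIndex(v, 5) << '\n'; // 1 or 3; which match wins is nondeterministic
}

As with the GPU version, which of several equal cells is reported depends on thread scheduling, so the result is only unique when the value occurs once.
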
+ const int /*orig_comp*/) noexcept { const int i = iv[0]; const int j = iv[1]; diff --git a/Src/Base/AMReX_FilCC_3D_C.H b/Src/Base/AMReX_FilCC_3D_C.H index 942d07f7b4d..8a837fbf7f1 100644 --- a/Src/Base/AMReX_FilCC_3D_C.H +++ b/Src/Base/AMReX_FilCC_3D_C.H @@ -12,9 +12,9 @@ inline void filcc_cell (const IntVect& iv, Array4 const& q, const int dcomp, const int numcomp, - GeometryData const& geom, const Real time, + GeometryData const& geom, const Real /*time*/, const BCRec* bcr, const int bcomp, - const int orig_comp) noexcept + const int /*orig_comp*/) noexcept { const int i = iv[0]; const int j = iv[1]; diff --git a/Src/Base/AMReX_FilCC_C.cpp b/Src/Base/AMReX_FilCC_C.cpp index 931915b0bc6..bde017a0485 100644 --- a/Src/Base/AMReX_FilCC_C.cpp +++ b/Src/Base/AMReX_FilCC_C.cpp @@ -3,7 +3,7 @@ namespace amrex { void fab_filcc (Box const& bx, Array4 const& qn, int ncomp, - Box const& domain, Real const* dx, Real const* xlo, + Box const& domain, Real const* /*dx*/, Real const* /*xlo*/, BCRec const* bcn) { const auto lo = amrex::lbound(bx); diff --git a/Src/Base/AMReX_FilND_C.H b/Src/Base/AMReX_FilND_C.H new file mode 100644 index 00000000000..01dd9a2479c --- /dev/null +++ b/Src/Base/AMReX_FilND_C.H @@ -0,0 +1,13 @@ +#ifndef AMREX_FILL_ND_H_ +#define AMREX_FILL_ND_H_ + +#include +#include + +namespace amrex { + void fab_filnd (Box const& bx, Array4 const& q, int ncomp, + Box const& domain, Real const* dx, Real const* xlo, + BCRec const* bc); +} + +#endif diff --git a/Src/Base/AMReX_FilND_C.cpp b/Src/Base/AMReX_FilND_C.cpp new file mode 100644 index 00000000000..610f4815f99 --- /dev/null +++ b/Src/Base/AMReX_FilND_C.cpp @@ -0,0 +1,100 @@ +#include + +namespace amrex { + +void fab_filnd (Box const& bx, Array4 const& qn, int ncomp, + Box const& domain, Real const* /*dx*/, Real const* /*xlo*/, + BCRec const* bcn) +{ + const auto lo = amrex::lbound(bx); + const auto hi = amrex::ubound(bx); + const auto domlo = amrex::lbound(domain); + const auto domhi = amrex::ubound(domain); + + const int ilo = domlo.x; + const int ihi = domhi.x; + +#if AMREX_SPACEDIM >= 2 + const int jlo = domlo.y; + const int jhi = domhi.y; +#endif + +#if AMREX_SPACEDIM == 3 + const int klo = domlo.z; + const int khi = domhi.z; +#endif + + for (int n = 0; n < ncomp; ++n) + { + Array4 q(qn,n); + BCRec const& bc = bcn[n]; + + if (lo.x < ilo && (bc.lo(0) != BCType::int_dir)) { + const int imin = lo.x; + const int imax = ilo-1; + for (int k = lo.z; k <= hi.z; ++k) { + for (int j = lo.y; j <= hi.y; ++j) { + for (int i = imin; i <= imax; ++i) { + q(i,j,k) = q(ilo,j,k); + }}} + } + + if (hi.x > ihi && (bc.hi(0) != BCType::int_dir)) { + const int imin = ihi+1; + const int imax = hi.x; + for (int k = lo.z; k <= hi.z; ++k) { + for (int j = lo.y; j <= hi.y; ++j) { + for (int i = imin; i <= imax; ++i) { + q(i,j,k) = q(ihi,j,k); + }}} + } + +#if AMREX_SPACEDIM >= 2 + + if (lo.y < jlo && (bc.lo(1) != BCType::int_dir)) { + const int jmin = lo.y; + const int jmax = jlo-1; + for (int k = lo.z; k <= hi.z; ++k) { + for (int j = jmin; j <= jmax; ++j) { + for (int i = lo.x; i <= hi.x; ++i) { + q(i,j,k) = q(i,jlo,k); + }}} + } + + if (hi.y > jhi && (bc.hi(1) != BCType::int_dir)) { + const int jmin = jhi+1; + const int jmax = hi.y; + for (int k = lo.z; k <= hi.z; ++k) { + for (int j = jmin; j <= jmax; ++j) { + for (int i = lo.x; i <= hi.x; ++i) { + q(i,j,k) = q(i,jhi,k); + }}} + } +#endif + +#if AMREX_SPACEDIM == 3 + + if (lo.z < klo && (bc.lo(2) != BCType::int_dir)) { + const int kmin = lo.z; + const int kmax = klo-1; + for (int k = kmin; k <= kmax; 
++k) { + for (int j = lo.y; j <= hi.y; ++j) { + for (int i = lo.x; i <= hi.x; ++i) { + q(i,j,k) = q(i,j,klo); + }}} + } + + if (hi.z > khi && (bc.hi(2) != BCType::int_dir)) { + const int kmin = khi+1; + const int kmax = hi.z; + for (int k = kmin; k <= kmax; ++k) { + for (int j = lo.y; j <= hi.y; ++j) { + for (int i = lo.x; i <= hi.x; ++i) { + q(i,j,k) = q(i,j,khi); + }}} + } +#endif + } +} + +} diff --git a/Src/Base/AMReX_FileSystem.H b/Src/Base/AMReX_FileSystem.H new file mode 100644 index 00000000000..3a8ccc28a72 --- /dev/null +++ b/Src/Base/AMReX_FileSystem.H @@ -0,0 +1,32 @@ +#ifndef AMREX_FILE_SYSTEM_H_ +#define AMREX_FILE_SYSTEM_H_ + +#include + +#ifdef _WIN32 +typedef unsigned short mode_t; +#else +#include // for mode_t +#endif + +namespace amrex { +namespace FileSystem { + +bool +CreateDirectories (std::string const& filename, mode_t mode, bool verbose = false); + +std::string +CurrentPath (); + +bool +Exists (std::string const& filename); + +bool +Remove (std::string const& filename); + +bool +RemoveAll (std::string const& p); // recursive remove + +}} + +#endif diff --git a/Src/Base/AMReX_FileSystem.cpp b/Src/Base/AMReX_FileSystem.cpp new file mode 100644 index 00000000000..372570beecf --- /dev/null +++ b/Src/Base/AMReX_FileSystem.cpp @@ -0,0 +1,215 @@ +#include +#include +#include +#include + +#if defined(_WIN32) // || __cplusplus >= 201703L + +#include +#include + +namespace amrex { +namespace FileSystem { + +bool +CreateDirectories (std::string const& p, mode_t /*mode*/, bool verbose) +{ + std::error_code ec; + std::filesystem::create_directories(std::filesystem::path{p}, ec); + if (ec and verbose) { + amrex::AllPrint() << "amrex::UtilCreateDirectory failed to create " + << p << ": " << ec.message() << std::endl; + } + return !ec; +} + +bool +Exists (std::string const& filename) +{ + std::error_code ec; + bool r = std::filesystem::exists(std::filesystem::path{filename}, ec); + if (ec and amrex::Verbose() > 0) { + amrex::AllPrint() << "amrex::FileSystem::Exists failed. " << ec.message() << std::endl; + } + return r; +} + +std::string +CurrentPath () +{ + std::error_code ec; + auto path = std::filesystem::current_path(ec); + if (ec and amrex::Verbose() > 0) { + amrex::AllPrint() << "amrex::FileSystem::CurrentPath failed. " << ec.message() << std::endl; + } + return path.string(); +} + +bool +Remove (std::string const& filename) +{ + std::error_code ec; + bool r = std::filesystem::remove(std::filesystem::path{filename},ec); + return !ec; +} + +bool +RemoveAll (std::string const& p) +{ + std::error_code ec; + std::filesystem::remove_all(std::filesystem::path{p},ec); + return !ec; +} + +}} + +#else + +#include +#include +#include +#include +#include +#include +#include + +namespace amrex { +namespace FileSystem { + +bool +CreateDirectories (std::string const& path, mode_t mode, bool verbose) +{ + bool retVal(false); + Vector > pathError; + + const char* path_sep_str = "/"; + + if (path.length() == 0 || path == path_sep_str) { + return true; + } + + errno = 0; + + if(std::strchr(path.c_str(), *path_sep_str) == 0) { + // + // No slashes in the path. + // + errno = 0; + if(mkdir(path.c_str(), mode) < 0 && errno != EEXIST) { + retVal = false; + } else { + retVal = true; + } + pathError.push_back(std::make_pair(path, errno)); + } else { + // + // Make copy of the directory pathname so we can write to it. 
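
AMReX_FileSystem.H above declares a small path API with two backing implementations: std::filesystem on Windows and the raw POSIX calls that follow. A usage sketch with hypothetical path names, assuming only the declarations from that header:

#include <AMReX_FileSystem.H>
#include <iostream>

void demo ()
{
    // 0755 is a typical mode_t value: rwx for owner, r-x for group/other.
    if (amrex::FileSystem::CreateDirectories("plt00000/Level_0", 0755)) {
        std::cout << "created under " << amrex::FileSystem::CurrentPath() << "\n";
    }
    if (amrex::FileSystem::Exists("plt00000")) {
        amrex::FileSystem::RemoveAll("plt00000"); // recursive remove
    }
}
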
+ // + char *dir = new char[path.length() + 1]; + (void) strcpy(dir, path.c_str()); + + char *slash = std::strchr(dir, *path_sep_str); + + if(dir[0] == *path_sep_str) { // full pathname. + do { + if(*(slash+1) == 0) { + break; + } + if((slash = std::strchr(slash+1, *path_sep_str)) != 0) { + *slash = 0; + } + errno = 0; + if(mkdir(dir, mode) < 0 && errno != EEXIST) { + retVal = false; + } else { + retVal = true; + } + pathError.push_back(std::make_pair(dir, errno)); + if(slash) { + *slash = *path_sep_str; + } + } while(slash); + + } else { // relative pathname. + + do { + *slash = 0; + errno = 0; + if(mkdir(dir, mode) < 0 && errno != EEXIST) { + retVal = false; + } else { + retVal = true; + } + pathError.push_back(std::make_pair(dir, errno)); + *slash = *path_sep_str; + } while((slash = std::strchr(slash+1, *path_sep_str)) != 0); + + errno = 0; + if(mkdir(dir, mode) < 0 && errno != EEXIST) { + retVal = false; + } else { + retVal = true; + } + pathError.push_back(std::make_pair(dir, errno)); + } + + delete [] dir; + } + + if(retVal == false || verbose == true) { + for(int i(0); i < pathError.size(); ++i) { + amrex::AllPrint()<< "amrex::UtilCreateDirectory:: path errno: " + << pathError[i].first + << " :: " + << strerror(pathError[i].second) + << std::endl; + } + } + + return retVal; +} + +bool +Exists (std::string const& filename) +{ + struct stat statbuff; + return (lstat(filename.c_str(), &statbuff) != -1); +} + +std::string +CurrentPath () +{ + constexpr int bufSize = 1024; + char temp[bufSize]; + char *rCheck = getcwd(temp, bufSize); + if(rCheck == 0) { + amrex::Abort("**** Error: getcwd buffer too small."); + } + return std::string(rCheck); +} + +bool +Remove (std::string const& filename) +{ + return unlink(filename.c_str()); +} + +bool +RemoveAll (std::string const& p) +{ + if (p.size() >= 1990) { + amrex::Error("FileSystem::RemoveAll: Path name too long"); + return false; + } + char command[2000]; + std::snprintf(command, 2000, "\\rm -rf %s", p.c_str()); + int retVal = std::system(command); + if (retVal == -1 || WEXITSTATUS(retVal) != 0) { + amrex::Error("Removing old directory failed."); + return false; + } + return true; +} + +}} + +#endif diff --git a/Src/Base/AMReX_Geometry.H b/Src/Base/AMReX_Geometry.H index a0732539e49..c76f5995058 100644 --- a/Src/Base/AMReX_Geometry.H +++ b/Src/Base/AMReX_Geometry.H @@ -50,7 +50,7 @@ struct GeometryData //! Returns our rectangular domain. AMREX_GPU_HOST_DEVICE AMREX_FORCE_INLINE const Box& Domain () const noexcept { return domain; } - //! Returns whether the domain is periodic in the given direction. +//! Returns whether the domain is periodic in the given direction. AMREX_GPU_HOST_DEVICE AMREX_FORCE_INLINE int isPeriodic (const int i) const noexcept { return is_periodic[i]; } //! Coordinates type @@ -104,11 +104,13 @@ public: void define (const Box& dom, const RealBox& rb, int coord, Array const& is_per) noexcept; //! Returns the problem domain. const RealBox& ProbDomain () const noexcept { return prob_domain; } + //! Returns the roundoff domain. + const RealBox& RoundoffDomain () const noexcept { return roundoff_domain; } //! Sets the problem domain. void ProbDomain (const RealBox& rb) noexcept { prob_domain = rb; - SetOffset(rb.lo()); + computeRoundoffDomain(); } //! Returns the lo end of the problem domain in each dimension.
const Real* ProbLo () const noexcept { return prob_domain.lo(); } @@ -120,11 +122,11 @@ public: Real ProbHi (int dir) const noexcept { return prob_domain.hi(dir); } GpuArray ProbLoArray () const noexcept { - return {AMREX_D_DECL(prob_domain.lo(0),prob_domain.lo(1),prob_domain.lo(2))}; + return {{AMREX_D_DECL(prob_domain.lo(0),prob_domain.lo(1),prob_domain.lo(2))}}; } GpuArray ProbHiArray () const noexcept { - return {AMREX_D_DECL(prob_domain.hi(0),prob_domain.hi(1),prob_domain.hi(2))}; + return {{AMREX_D_DECL(prob_domain.hi(0),prob_domain.hi(1),prob_domain.hi(2))}}; } //! Returns the overall size of the domain by multiplying the ProbLength's together @@ -137,7 +139,11 @@ public: //! Returns our rectangular domain. const Box& Domain () const noexcept { return domain; } //! Sets our rectangular domain. - void Domain (const Box& bx) noexcept { domain = bx; } + void Domain (const Box& bx) noexcept + { + domain = bx; + computeRoundoffDomain(); + } //! Define a multifab of areas and volumes with given grow factor. void GetVolume (MultiFab& vol, const BoxArray& grds, @@ -190,27 +196,14 @@ public: return AMREX_D_TERM(isPeriodic(0),&&isPeriodic(1),&&isPeriodic(2)); } Array isPeriodic () const noexcept { - return {AMREX_D_DECL(static_cast(is_periodic[0]), - static_cast(is_periodic[1]), - static_cast(is_periodic[2]))}; + return {{AMREX_D_DECL(static_cast(is_periodic[0]), + static_cast(is_periodic[1]), + static_cast(is_periodic[2]))}}; } GpuArray isPeriodicArray () const noexcept { -// HIP FIX HERE - Initialization List -#ifdef AMREX_USE_HIP - GpuArray arr; - for (int i=0; i(is_periodic[i]); } - return arr; -/* - return {(int[AMREX_SPACEDIM]){AMREX_D_DECL(static_cast(is_periodic[0]), - static_cast(is_periodic[1]), - static_cast(is_periodic[2]))}}; -*/ -#else - return {AMREX_D_DECL(static_cast(is_periodic[0]), - static_cast(is_periodic[1]), - static_cast(is_periodic[2]))}; -#endif + return {{AMREX_D_DECL(static_cast(is_periodic[0]), + static_cast(is_periodic[1]), + static_cast(is_periodic[2]))}}; } //! What's period in specified direction? int period (int dir) const noexcept { BL_ASSERT(is_periodic[dir]); return domain.length(dir); } @@ -250,9 +243,9 @@ public: //! Array setPeriodicity (Array const& period) noexcept { - Array r{AMREX_D_DECL(is_periodic[0], - is_periodic[1], - is_periodic[2])}; + Array r{{AMREX_D_DECL(is_periodic[0], + is_periodic[1], + is_periodic[2])}}; AMREX_D_TERM(is_periodic[0] = period[0];, is_periodic[1] = period[1];, is_periodic[2] = period[2];); @@ -275,12 +268,41 @@ public: } } + /** + * \brief Returns true if a point is outside the roundoff domain. + * All particles with positions inside the roundoff domain + * are sure to be mapped to cells inside the Domain() box. Note that + * the same need not be true for all points inside ProbDomain(). + */ + bool outsideRoundoffDomain (AMREX_D_DECL(Real x, Real y, Real z)) const; + + /** + * \brief Returns true if a point is inside the roundoff domain. + * All particles with positions inside the roundoff domain + * are sure to be mapped to cells inside the Domain() box. Note that + * the same need not be true for all points inside ProbDomain(). + */ + bool insideRoundoffDomain (AMREX_D_DECL(Real x, Real y, Real z)) const; + + /** + * \brief Compute the roundoff domain. Public because it contains an + * extended host / device lambda. 
+ */ + void computeRoundoffDomain (); + private: void read_params (); // is_periodic and RealBox used to be static bool is_periodic[AMREX_SPACEDIM] = {AMREX_D_DECL(false,false,false)}; RealBox prob_domain; + + // Due to round-off errors, not all floating point numbers for which plo <= x < phi + // will map to a cell that is inside "domain". "roundoff_domain" stores a phi + // that is very close to that in prob_domain, and for which all floating point numbers + // inside it according to a naive inequality check will map to a cell inside domain. + RealBox roundoff_domain; + // Box domain; }; diff --git a/Src/Base/AMReX_Geometry.cpp b/Src/Base/AMReX_Geometry.cpp index eaaa84409b2..1ff6b4292c5 100644 --- a/Src/Base/AMReX_Geometry.cpp +++ b/Src/Base/AMReX_Geometry.cpp @@ -2,6 +2,7 @@ #include +#include #include #include #include @@ -9,9 +10,7 @@ #include #include -#ifdef _OPENMP -#include -#endif +#include namespace amrex { @@ -39,7 +38,7 @@ operator>> (std::istream& is, is >> c; IntVect is_per; is >> is_per; - g.setPeriodicity({AMREX_D_DECL(is_per[0],is_per[1],is_per[2])}); + g.setPeriodicity({{AMREX_D_DECL(is_per[0],is_per[1],is_per[2])}}); } else { g.setPeriodicity(DefaultGeometry().isPeriodic()); } @@ -104,12 +103,7 @@ Geometry::define (const Box& dom, const RealBox* rb, int coord, domain = dom; ok = true; - for (int k = 0; k < AMREX_SPACEDIM; k++) - { - offset[k] = prob_domain.lo(k); - dx[k] = prob_domain.length(k)/(Real(domain.length(k))); - inv_dx[k] = 1.0/dx[k]; - } + computeRoundoffDomain(); } void @@ -119,9 +113,7 @@ Geometry::Setup (const RealBox* rb, int coord, int const* isper) noexcept if (gg->ok) return; -#ifdef _OPENMP - BL_ASSERT(!omp_in_parallel()); -#endif + BL_ASSERT(!OpenMP::in_parallel()); ParmParse pp("geometry"); @@ -401,4 +393,62 @@ Geometry::growPeriodicDomain (int ngrow) const noexcept return b; } +void +Geometry::computeRoundoffDomain () +{ + for (int k = 0; k < AMREX_SPACEDIM; k++) + { + offset[k] = prob_domain.lo(k); + dx[k] = prob_domain.length(k)/(Real(domain.length(k))); + inv_dx[k] = 1.0/dx[k]; + } + + roundoff_domain = prob_domain; + for (int idim = 0; idim < AMREX_SPACEDIM; ++idim) + { + int ilo = Domain().smallEnd(idim); + int ihi = Domain().bigEnd(idim); + Real plo = ProbLo(idim); + Real phi = ProbHi(idim); + Real idx = InvCellSize(idim); + Real deltax = CellSize(idim); + +#ifdef AMREX_SINGLE_PRECISION_PARTICLES + Real tolerance = std::max(1.e-4*deltax, 1.e-10*phi); +#else + Real tolerance = std::max(1.e-8*deltax, 1.e-14*phi); +#endif + // bisect the point at which the cell no longer maps to inside the domain + Real lo = static_cast(phi) - Real(0.5)*static_cast(deltax); + Real hi = static_cast(phi) + Real(0.5)*static_cast(deltax); + + Real mid = bisect(lo, hi, + [=] AMREX_GPU_HOST_DEVICE (Real x) -> Real + { + int i = int(Math::floor((x - plo)*idx)) + ilo; + bool inside = i >= ilo and i <= ihi; + return static_cast(inside) - Real(0.5); + }, tolerance); + roundoff_domain.setHi(idim, mid - tolerance); + } +} + +bool +Geometry::outsideRoundoffDomain (AMREX_D_DECL(Real x, Real y, Real z)) const +{ + bool outside = AMREX_D_TERM(x < roundoff_domain.lo(0) + || x >= roundoff_domain.hi(0), + || y < roundoff_domain.lo(1) + || y >= roundoff_domain.hi(1), + || z < roundoff_domain.lo(2) + || z >= roundoff_domain.hi(2)); + return outside; +} + +bool +Geometry::insideRoundoffDomain (AMREX_D_DECL(Real x, Real y, Real z)) const +{ + return !outsideRoundoffDomain(AMREX_D_DECL(x, y, z)); +} + } diff --git a/Src/Base/AMReX_Gpu.H b/Src/Base/AMReX_Gpu.H index
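
computeRoundoffDomain above finds the safe upper edge with a sign-change bisection: the predicate is +0.5 while floor((x - plo)*idx) + ilo still lands inside [ilo, ihi] and -0.5 once it does not. A self-contained sketch of that search in plain double arithmetic (amrex::bisect itself is assumed to behave like this generic version):

#include <cmath>
#include <cstdio>

// Generic bisection on [lo,hi] for a function with f(lo) > 0 > f(hi).
template <typename F>
double bisect (double lo, double hi, F f, double tol)
{
    while (hi - lo > tol) {
        double mid = 0.5*(lo + hi);
        if (f(mid) > 0.0) { lo = mid; } else { hi = mid; }
    }
    return 0.5*(lo + hi);
}

int main ()
{
    double plo = 0.0, phi = 1.0;          // hypothetical problem domain
    int ilo = 0, ihi = 127;               // index domain, 128 cells
    double dx = (phi - plo)/128.0, idx = 1.0/dx;
    auto inside = [=] (double x) {
        int i = (int)std::floor((x - plo)*idx) + ilo;
        return (i >= ilo && i <= ihi) ? 0.5 : -0.5;
    };
    double edge = bisect(phi - 0.5*dx, phi + 0.5*dx, inside, 1e-14);
    std::printf("positions below %.17g map inside the domain\n", edge);
}

Backing the stored hi off by one tolerance, as the real code does, then guarantees that any x passing the naive x < roundoff_domain.hi() check maps to a valid cell.
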
3d7ff6f9ae1..5c59d89305b 100644 --- a/Src/Base/AMReX_Gpu.H +++ b/Src/Base/AMReX_Gpu.H @@ -9,10 +9,12 @@ namespace amrex { namespace Cuda {} } #endif #include +#include #include #include #include #include +#include #include #include diff --git a/Src/Base/AMReX_GpuAllocators.H b/Src/Base/AMReX_GpuAllocators.H index 53d65d088a0..99b01f30a37 100644 --- a/Src/Base/AMReX_GpuAllocators.H +++ b/Src/Base/AMReX_GpuAllocators.H @@ -5,6 +5,7 @@ #include #include #include +#include #include #include @@ -20,11 +21,17 @@ namespace amrex { template struct RunOnGpu : std::false_type {}; - -#ifdef AMREX_USE_GPU - + + struct ArenaAllocatorTraits { + typedef std::true_type propagate_on_container_copy_assignment; + typedef std::true_type propagate_on_container_move_assignment; + typedef std::true_type propagate_on_container_swap; + typedef std::true_type is_always_equal; + }; + template class ArenaAllocator + : public ArenaAllocatorTraits { public : @@ -33,18 +40,19 @@ namespace amrex { inline value_type* allocate(std::size_t n) { value_type* result = nullptr; - result = (value_type*) The_Arena()->alloc(n * sizeof(T)); + result = (value_type*) The_Arena()->alloc(n * sizeof(T)); return result; } - + inline void deallocate(value_type* ptr, std::size_t) { The_Arena()->free(ptr); - } + } }; template class DeviceArenaAllocator + : public ArenaAllocatorTraits { public : @@ -53,18 +61,19 @@ namespace amrex { inline value_type* allocate(std::size_t n) { value_type* result = nullptr; - result = (value_type*) The_Device_Arena()->alloc(n * sizeof(T)); + result = (value_type*) The_Device_Arena()->alloc(n * sizeof(T)); return result; } - + inline void deallocate(value_type* ptr, std::size_t) { The_Device_Arena()->free(ptr); - } + } }; template class PinnedArenaAllocator + : public ArenaAllocatorTraits { public : @@ -73,18 +82,19 @@ namespace amrex { inline value_type* allocate(std::size_t n) { value_type* result = nullptr; - result = (value_type*) The_Pinned_Arena()->alloc(n * sizeof(T)); + result = (value_type*) The_Pinned_Arena()->alloc(n * sizeof(T)); return result; } - + inline void deallocate(value_type* ptr, std::size_t) { The_Pinned_Arena()->free(ptr); - } + } }; template class ManagedArenaAllocator + : public ArenaAllocatorTraits { public : @@ -93,14 +103,14 @@ namespace amrex { inline value_type* allocate(std::size_t n) { value_type* result = nullptr; - result = (value_type*) The_Managed_Arena()->alloc(n * sizeof(T)); + result = (value_type*) The_Managed_Arena()->alloc(n * sizeof(T)); return result; } - + inline void deallocate(value_type* ptr, std::size_t) { The_Managed_Arena()->free(ptr); - } + } }; template @@ -110,10 +120,12 @@ namespace amrex { using value_type = T; + PolymorphicAllocator () : m_use_gpu_aware_mpi(ParallelDescriptor::UseGpuAwareMpi()) {} + inline value_type* allocate(std::size_t n) { value_type* result = nullptr; - if (ParallelDescriptor::UseGpuAwareMpi()) + if (m_use_gpu_aware_mpi) { result = (value_type*) The_Device_Arena()->alloc(n * sizeof(T)); } @@ -123,10 +135,10 @@ namespace amrex { } return result; } - + inline void deallocate(value_type* ptr, std::size_t) { - if (ParallelDescriptor::UseGpuAwareMpi()) + if (m_use_gpu_aware_mpi) { The_Device_Arena()->free(ptr); } @@ -134,23 +146,27 @@ namespace amrex { { The_Pinned_Arena()->free(ptr); } - } - }; + } - template
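
The allocator changes above do two things: PolymorphicAllocator now caches UseGpuAwareMpi() once at construction, and every arena allocator inherits ArenaAllocatorTraits, whose typedefs (propagate_on_container_copy_assignment and friends) tell standard containers how to treat allocator state on copy, move, and swap. A minimal allocator skeleton with the same traits, using plain new/delete rather than the AMReX arenas, purely as an illustration:

#include <cstddef>
#include <type_traits>
#include <vector>

template <typename T>
struct TraitsAllocator
{
    using value_type = T;
    // Containers consult these when copying, moving, or swapping:
    using propagate_on_container_copy_assignment = std::true_type;
    using propagate_on_container_move_assignment = std::true_type;
    using propagate_on_container_swap            = std::true_type;
    using is_always_equal                        = std::true_type;

    TraitsAllocator () = default;
    template <typename U> TraitsAllocator (TraitsAllocator<U> const&) {}

    T* allocate (std::size_t n) { return static_cast<T*>(::operator new(n*sizeof(T))); }
    void deallocate (T* p, std::size_t) { ::operator delete(p); }
};

template <typename T, typename U>
bool operator== (TraitsAllocator<T> const&, TraitsAllocator<U> const&) { return true; }
template <typename T, typename U>
bool operator!= (TraitsAllocator<T> const&, TraitsAllocator<U> const&) { return false; }

int main ()
{
    std::vector<int, TraitsAllocator<int>> v{1, 2, 3};
    return v.size() == 3 ? 0 : 1;
}

Setting is_always_equal promises that any instance can free memory obtained from any other instance, which lets containers move buffers instead of elements; that holds for the arena-backed allocators above because the arenas are process-global singletons.
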